
Commit f4d9843 (1 parent: 3316616)

Resolved comments

4 files changed: +10 -32 lines

docs/sql-data-sources-json.md

Lines changed: 0 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -116,12 +116,6 @@ Data source options of JSON can be set via:
116116
</td>
117117
<td>read/write</td>
118118
</tr>
119-
<tr>
120-
<td><code>maxFilesPerTrigger</code></td>
121-
<td>None</td>
122-
<td>Sets the maximum number of new files to be considered in every trigger.</td>
123-
<td>read</td>
124-
</tr>
125119
<tr>
126120
<td><code>primitivesAsString</code></td>
127121
<td>None</td>

python/pyspark/sql/readwriter.py

Lines changed: 0 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -108,35 +108,13 @@ def schema(self, schema):
108108
@since(1.5)
109109
def option(self, key, value):
110110
"""Adds an input option for the underlying data source.
111-
112-
You can set the following option(s) for reading files:
113-
* ``pathGlobFilter``: an optional glob pattern to only include files with paths matching
114-
the pattern. The syntax follows org.apache.hadoop.fs.GlobFilter.
115-
It does not change the behavior of partition discovery.
116-
* ``modifiedBefore``: an optional timestamp to only include files with
117-
modification times occurring before the specified time. The provided timestamp
118-
must be in the following format: YYYY-MM-DDTHH:mm:ss (e.g. 2020-06-01T13:00:00)
119-
* ``modifiedAfter``: an optional timestamp to only include files with
120-
modification times occurring after the specified time. The provided timestamp
121-
must be in the following format: YYYY-MM-DDTHH:mm:ss (e.g. 2020-06-01T13:00:00)
122111
"""
123112
self._jreader = self._jreader.option(key, to_str(value))
124113
return self
125114

126115
@since(1.4)
127116
def options(self, **options):
128117
"""Adds input options for the underlying data source.
129-
130-
You can set the following option(s) for reading files:
131-
* ``pathGlobFilter``: an optional glob pattern to only include files with paths matching
132-
the pattern. The syntax follows org.apache.hadoop.fs.GlobFilter.
133-
It does not change the behavior of partition discovery.
134-
* ``modifiedBefore``: an optional timestamp to only include files with
135-
modification times occurring before the specified time. The provided timestamp
136-
must be in the following format: YYYY-MM-DDTHH:mm:ss (e.g. 2020-06-01T13:00:00)
137-
* ``modifiedAfter``: an optional timestamp to only include files with
138-
modification times occurring after the specified time. The provided timestamp
139-
must be in the following format: YYYY-MM-DDTHH:mm:ss (e.g. 2020-06-01T13:00:00)
140118
"""
141119
for k in options:
142120
self._jreader = self._jreader.option(k, to_str(options[k]))
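
For context: the options described in the removed docstring text remain usable through option()/options(); only the duplicated documentation is dropped in favor of the central Generic Files Source Options page. A minimal Scala sketch of those generic file-source options on a batch read (the app name and input path are hypothetical placeholders, not from this commit):

import org.apache.spark.sql.SparkSession

object GenericFileOptionsExample {
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder().appName("generic-file-options").getOrCreate()

    val df = spark.read
      // Only include files whose names match the glob; the syntax follows
      // org.apache.hadoop.fs.GlobFilter. Partition discovery is unaffected.
      .option("pathGlobFilter", "*.json")
      // Only include files modified after this timestamp
      // (format: YYYY-MM-DDTHH:mm:ss).
      .option("modifiedAfter", "2020-06-01T13:00:00")
      .json("/data/input")  // hypothetical path

    df.show()
    spark.stop()
  }
}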

sql/core/src/main/scala/org/apache/spark/sql/DataFrameReader.scala

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -392,8 +392,8 @@ class DataFrameReader private[sql](sparkSession: SparkSession) extends Logging {
392392
*
393393
* You can find the JSON-specific options for reading JSON files in
394394
* <a href="https://spark.apache.org/docs/latest/sql-data-sources-json.html#data-source-option">
395-
* Data Source Option</a>
396-
* and
395+
* Data Source Option</a> in the version you use.
396+
* More general options can be found in
397397
* <a href=
398398
* "https://spark.apache.org/docs/latest/sql-data-sources-generic-options.html">
399399
* Generic Files Source Options</a> in the version you use.
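
The reworded link points batch readers at the JSON-specific option list. As a quick illustration, a hedged sketch using one such option, primitivesAsString (which also appears in the doc table above); the app name and path are hypothetical placeholders:

import org.apache.spark.sql.SparkSession

object JsonSpecificOptionExample {
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder().appName("json-specific-option").getOrCreate()

    // primitivesAsString is one of the JSON-specific options on the linked
    // page: it makes the reader infer every primitive value as a string.
    val df = spark.read
      .option("primitivesAsString", "true")
      .json("/data/events")  // hypothetical path

    df.printSchema()
    spark.stop()
  }
}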

sql/core/src/main/scala/org/apache/spark/sql/streaming/DataStreamReader.scala

Lines changed: 8 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -218,10 +218,16 @@ final class DataStreamReader private[sql](sparkSession: SparkSession) extends Lo
218218
* This function goes through the input once to determine the input schema. If you know the
219219
* schema in advance, use the version that specifies the schema to avoid the extra scan.
220220
*
221+
* You can set the following structured streaming option(s):
222+
* <ul>
223+
* <li>`maxFilesPerTrigger` (default: no max limit): sets the maximum number of new files to be
224+
* considered in every trigger.</li>
225+
* </ul>
226+
*
221227
* You can find the JSON-specific options for reading JSON file stream in
222228
* <a href="https://spark.apache.org/docs/latest/sql-data-sources-json.html#data-source-option">
223-
* Data Source Option</a>
224-
* and
229+
* Data Source Option</a> in the version you use.
230+
* More general options can be found in
225231
* <a href=
226232
* "https://spark.apache.org/docs/latest/sql-data-sources-generic-options.html">
227233
* Generic Files Source Options</a> in the version you use.
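
The maxFilesPerTrigger documentation removed from the batch-oriented JSON page above now lives here, on the streaming reader where the option actually applies. A minimal sketch of a streaming JSON read using it (the schema, paths, and the cap of 10 files are illustrative assumptions):

import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.types.{LongType, StringType, StructType}

object MaxFilesPerTriggerExample {
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder().appName("json-stream").getOrCreate()

    // Streaming file sources need an explicit schema
    // (unless spark.sql.streaming.schemaInference is enabled).
    val schema = new StructType()
      .add("id", LongType)
      .add("msg", StringType)

    val stream = spark.readStream
      .schema(schema)
      // Cap each micro-batch at 10 newly discovered files; the default,
      // per the doc change above, is no limit.
      .option("maxFilesPerTrigger", 10L)
      .json("/data/incoming")  // hypothetical directory

    stream.writeStream
      .format("console")
      .start()
      .awaitTermination()
  }
}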
