Commit 0f3b68b

Spark 3.5, 4.0: Support Spark Partial Limit Push Down
1 parent 21e6e41 commit 0f3b68b

19 files changed: +1083 -33 lines changed

api/src/main/java/org/apache/iceberg/FileScanTask.java

Lines changed: 4 additions & 0 deletions
@@ -54,4 +54,8 @@ default boolean isFileScanTask() {
   default FileScanTask asFileScanTask() {
     return this;
   }
+
+  default long minRecordCountEstimate() {
+    return deletes().isEmpty() ? file().recordCount() : 0;
+  }
 }
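
The new default gives planners a conservative lower bound on the rows a task is guaranteed to produce: the data file's record count when the task carries no delete files, and 0 otherwise, since deletes could remove any number of rows. A minimal sketch of how a caller can accumulate these bounds against a query limit; the helper class below is illustrative and not part of this commit.

import java.util.ArrayList;
import java.util.List;
import org.apache.iceberg.FileScanTask;

class LimitPlanningSketch {
  // Illustrative only: keep adding tasks until their guaranteed rows cover the limit.
  static List<FileScanTask> takeUntilLimit(Iterable<FileScanTask> tasks, long limit) {
    List<FileScanTask> selected = new ArrayList<>();
    long remaining = limit;
    for (FileScanTask task : tasks) {
      selected.add(task);
      // Tasks with delete files report 0, so they never shrink the remaining limit
      // and planning safely continues past them.
      remaining -= task.minRecordCountEstimate();
      if (remaining <= 0) {
        break;
      }
    }
    return selected;
  }
}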

org/apache/iceberg/events/LimitAwareScanTaskEvent.java (new file)

Lines changed: 38 additions & 0 deletions
@@ -0,0 +1,38 @@
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package org.apache.iceberg.events;

/** Event sent to listeners when a scan task is planned, used for limit push down tracking. */
public final class LimitAwareScanTaskEvent {
  private final String taskName;
  private final long minRecordCountEstimate;

  public LimitAwareScanTaskEvent(String taskName, long minRecordCountEstimate) {
    this.taskName = taskName;
    this.minRecordCountEstimate = minRecordCountEstimate;
  }

  public String taskName() {
    return taskName;
  }

  public long minRecordCountEstimate() {
    return minRecordCountEstimate;
  }
}
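
TableScanUtil (next diff) publishes these events through the existing org.apache.iceberg.events.Listeners hook, so they can be observed by registering a listener. A minimal sketch, assuming the current Listener/Listeners API; the logging listener itself is illustrative.

import org.apache.iceberg.events.Listener;
import org.apache.iceberg.events.Listeners;
import org.apache.iceberg.events.LimitAwareScanTaskEvent;

class LimitPushDownEventLogger implements Listener<LimitAwareScanTaskEvent> {

  static void install() {
    // Deliver every LimitAwareScanTaskEvent emitted during scan planning to this logger.
    Listeners.register(new LimitPushDownEventLogger(), LimitAwareScanTaskEvent.class);
  }

  @Override
  public void notify(LimitAwareScanTaskEvent event) {
    System.out.printf(
        "planned %s, min record estimate %d%n", event.taskName(), event.minRecordCountEstimate());
  }
}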

core/src/main/java/org/apache/iceberg/util/TableScanUtil.java

Lines changed: 71 additions & 15 deletions
@@ -35,6 +35,8 @@
 import org.apache.iceberg.ScanTaskGroup;
 import org.apache.iceberg.SplittableScanTask;
 import org.apache.iceberg.StructLike;
+import org.apache.iceberg.events.LimitAwareScanTaskEvent;
+import org.apache.iceberg.events.Listeners;
 import org.apache.iceberg.io.CloseableIterable;
 import org.apache.iceberg.relocated.com.google.common.base.Preconditions;
 import org.apache.iceberg.relocated.com.google.common.collect.FluentIterable;
@@ -107,25 +109,35 @@ public static <T extends ScanTask> List<ScanTaskGroup<T>> planTaskGroups(
         planTaskGroups(CloseableIterable.withNoopClose(tasks), splitSize, lookback, openFileCost));
   }
 
-  @SuppressWarnings("unchecked")
   public static <T extends ScanTask> CloseableIterable<ScanTaskGroup<T>> planTaskGroups(
       CloseableIterable<T> tasks, long splitSize, int lookback, long openFileCost) {
+    return planTaskGroups(tasks, splitSize, lookback, openFileCost, 0);
+  }
 
-    validatePlanningArguments(splitSize, lookback, openFileCost);
+  @SuppressWarnings("unchecked")
+  public static <T extends ScanTask> CloseableIterable<ScanTaskGroup<T>> planTaskGroups(
+      CloseableIterable<T> tasks, long splitSize, int lookback, long openFileCost, int limit) {
 
-    // capture manifests which can be closed after scan planning
-    CloseableIterable<T> splitTasks =
-        CloseableIterable.combine(
-            FluentIterable.from(tasks)
-                .transformAndConcat(
-                    task -> {
-                      if (task instanceof SplittableScanTask<?>) {
-                        return ((SplittableScanTask<? extends T>) task).split(splitSize);
-                      } else {
-                        return ImmutableList.of(task);
-                      }
-                    }),
-            tasks);
+    validatePlanningArguments(splitSize, lookback, openFileCost);
+    CloseableIterable<T> splitTasks;
+    if (limit > 0) {
+      // optimize scan planning by stopping early when estimated row count reaches limit
+      splitTasks = splitScanTasksWithLimitPushDown(tasks, splitSize, limit);
+    } else {
+      // capture manifests which can be closed after scan planning
+      splitTasks =
+          CloseableIterable.combine(
+              FluentIterable.from(tasks)
+                  .transformAndConcat(
+                      task -> {
+                        if (task instanceof SplittableScanTask<?>) {
+                          return ((SplittableScanTask<? extends T>) task).split(splitSize);
+                        } else {
+                          return ImmutableList.of(task);
+                        }
+                      }),
+              tasks);
+    }
 
     Function<T, Long> weightFunc =
         task -> Math.max(task.sizeBytes(), task.filesCount() * openFileCost);
@@ -249,4 +261,48 @@ private static void validatePlanningArguments(long splitSize, int lookback, long
     Preconditions.checkArgument(lookback > 0, "Split planning lookback must be > 0: %s", lookback);
     Preconditions.checkArgument(openFileCost >= 0, "File open cost must be >= 0: %s", openFileCost);
   }
+
+  private static <T> CloseableIterable<T> splitScanTasksWithLimitPushDown(
+      CloseableIterable<T> tasks, long splitSize, int limit) {
+
+    List<T> candidateTasks = Lists.newArrayList();
+    long remainingLimit = limit;
+
+    for (T task : tasks) {
+      if (task instanceof SplittableScanTask<?>) {
+        @SuppressWarnings("unchecked")
+        SplittableScanTask<? extends T> splittable = (SplittableScanTask<? extends T>) task;
+        for (T splitTask : splittable.split(splitSize)) {
+          candidateTasks.add(splitTask);
+          remainingLimit = updateRemainingLimit(splitTask, remainingLimit);
+          if (remainingLimit <= 0) {
+            break;
+          }
+        }
+      } else {
+        candidateTasks.add(task);
+        remainingLimit = updateRemainingLimit(task, remainingLimit);
+      }
+
+      if (remainingLimit <= 0) {
+        break;
+      }
+    }
+
+    return CloseableIterable.combine(candidateTasks, tasks);
+  }
+
+  @SuppressWarnings("unchecked")
+  private static <T> long updateRemainingLimit(T task, long remainingLimit) {
+    if (task instanceof ScanTask) {
+      ScanTask scanTask = (ScanTask) task;
+      if (scanTask.isFileScanTask()) {
+        FileScanTask fileTask = scanTask.asFileScanTask();
+        long estimate = fileTask.minRecordCountEstimate();
+        Listeners.notifyAll(new LimitAwareScanTaskEvent(fileTask.toString(), estimate));
+        return remainingLimit - estimate;
+      }
+    }
+    return remainingLimit;
+  }
 }
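
The new five-argument overload lets callers that already know the query's row limit pass it into planning; accumulated minRecordCountEstimate() values then let task splitting stop early, while a limit of 0 keeps the original behavior. A rough usage sketch; the split size, lookback, and open-file-cost values are placeholders rather than anything this commit prescribes.

import org.apache.iceberg.FileScanTask;
import org.apache.iceberg.ScanTaskGroup;
import org.apache.iceberg.Table;
import org.apache.iceberg.io.CloseableIterable;
import org.apache.iceberg.util.TableScanUtil;

class LimitAwarePlanningSketch {
  static CloseableIterable<ScanTaskGroup<FileScanTask>> planWithLimit(Table table, int limit) {
    CloseableIterable<FileScanTask> fileTasks = table.newScan().planFiles();
    return TableScanUtil.planTaskGroups(
        fileTasks,
        134_217_728L, // 128 MB target split size (placeholder)
        10, // bin-packing lookback (placeholder)
        4_194_304L, // per-file open cost in bytes (placeholder)
        limit); // pushed-down LIMIT; 0 falls back to the previous planning path
  }
}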

org/apache/iceberg/spark/LimitPushDownBenchmark.java (new file)

Lines changed: 172 additions & 0 deletions
@@ -0,0 +1,172 @@
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package org.apache.iceberg.spark;

import com.google.errorprone.annotations.FormatMethod;
import com.google.errorprone.annotations.FormatString;
import java.util.Locale;
import java.util.concurrent.TimeUnit;
import org.apache.iceberg.spark.extensions.IcebergSparkSessionExtensions;
import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Row;
import org.apache.spark.sql.SparkSession;
import org.apache.spark.sql.catalyst.analysis.NoSuchTableException;
import org.apache.spark.sql.catalyst.parser.ParseException;
import org.openjdk.jmh.annotations.Benchmark;
import org.openjdk.jmh.annotations.BenchmarkMode;
import org.openjdk.jmh.annotations.Fork;
import org.openjdk.jmh.annotations.Measurement;
import org.openjdk.jmh.annotations.Mode;
import org.openjdk.jmh.annotations.Param;
import org.openjdk.jmh.annotations.Scope;
import org.openjdk.jmh.annotations.Setup;
import org.openjdk.jmh.annotations.State;
import org.openjdk.jmh.annotations.TearDown;
import org.openjdk.jmh.annotations.Threads;
import org.openjdk.jmh.annotations.Timeout;
import org.openjdk.jmh.annotations.Warmup;
import org.openjdk.jmh.infra.Blackhole;

/**
 * A benchmark that evaluates the limit push down performance.
 *
 * <p>To run this benchmark for spark-3.5: <code>
 *   ./gradlew -DsparkVersions=3.5 :iceberg-spark:iceberg-spark-extensions-3.5_2.12:jmh
 *       -PjmhIncludeRegex=LimitPushDownBenchmark
 *       -PjmhOutputPath=benchmark/iceberg-limit-push-down-benchmark.txt
 * </code>
 */
@Fork(1)
@State(Scope.Benchmark)
@Warmup(iterations = 3)
@Measurement(iterations = 5)
@Timeout(time = 10, timeUnit = TimeUnit.MINUTES)
@BenchmarkMode(Mode.AverageTime)
public class LimitPushDownBenchmark {

  private static final String TABLE_NAME = "test_limit_table";

  @Param({"100", "1000", "10000"})
  private int limitValue;

  @Param({"true", "false"})
  private boolean limitPushDownEnabled;

  private SparkSession spark;

  @Setup
  public void setupBenchmark() throws NoSuchTableException, ParseException {
    setupSpark();
    setupTable();
  }

  @TearDown
  public void tearDownBenchmark() {
    dropTable();
    tearDownSpark();
  }

  @Benchmark
  @Threads(1)
  public void limitQuery(Blackhole blackhole) {
    spark
        .conf()
        .set("spark.sql.iceberg.limit-push-down.enabled", String.valueOf(limitPushDownEnabled));

    Dataset<Row> result =
        spark.sql(
            String.format(Locale.ROOT, "SELECT * FROM local.%s LIMIT %d", TABLE_NAME, limitValue));

    blackhole.consume(result.count());
  }

  @Benchmark
  @Threads(1)
  public void limitQueryWithPartitionPruning(Blackhole blackhole) {
    spark
        .conf()
        .set("spark.sql.iceberg.limit-push-down.enabled", String.valueOf(limitPushDownEnabled));

    Dataset<Row> result =
        spark.sql(
            String.format(
                Locale.ROOT,
                "SELECT * FROM local.%s WHERE category != '0' LIMIT %d",
                TABLE_NAME,
                limitValue));

    blackhole.consume(result.count());
  }

  private void setupSpark() {
    this.spark =
        SparkSession.builder()
            .appName("limit-push-down-benchmark")
            .master("local[1]")
            .config("spark.sql.extensions", IcebergSparkSessionExtensions.class.getName())
            .config("spark.sql.catalog.local", "org.apache.iceberg.spark.SparkCatalog")
            .config("spark.sql.catalog.local.type", "hadoop")
            .config("spark.sql.catalog.local.warehouse", "/tmp/iceberg-benchmark-warehouse")
            .getOrCreate();
  }

  private void setupTable() {
    sql("DROP TABLE IF EXISTS local.%s PURGE", TABLE_NAME);

    sql(
        "CREATE TABLE local.%s (id BIGINT, data STRING, value DOUBLE, category STRING) "
            + "USING iceberg PARTITIONED BY (id)",
        TABLE_NAME);

    // Insert substantial data across multiple partitions
    for (int partition = 0; partition < 100; partition++) {
      StringBuilder values = new StringBuilder();
      for (int row = 0; row < 5000; row++) {
        int id = partition * 5000 + row;
        if (values.length() > 0) {
          values.append(", ");
        }
        values.append(
            String.format(
                Locale.ROOT,
                "(%d, 'data_%d', %f, 'category_%d')",
                id,
                id,
                Math.random() * 1000,
                partition));
      }
      sql("INSERT INTO local.%s VALUES %s", TABLE_NAME, values.toString());
    }
  }

  private void dropTable() {
    sql("DROP TABLE IF EXISTS local.%s PURGE", TABLE_NAME);
  }

  private void tearDownSpark() {
    if (spark != null) {
      spark.stop();
    }
  }

  @FormatMethod
  private void sql(@FormatString String query, Object... args) {
    spark.sql(String.format(query, args));
  }
}

spark/v3.5/spark/src/main/java/org/apache/iceberg/spark/SparkReadConf.java

Lines changed: 8 additions & 0 deletions
@@ -277,6 +277,14 @@ public boolean aggregatePushDownEnabled() {
         .parse();
   }
 
+  public boolean limitPushDownEnabled() {
+    return confParser
+        .booleanConf()
+        .sessionConf(SparkSQLProperties.LIMIT_PUSH_DOWN_ENABLED)
+        .defaultValue(SparkSQLProperties.LIMIT_PUSH_DOWN_ENABLED_DEFAULT)
+        .parse();
+  }
+
   public boolean adaptiveSplitSizeEnabled() {
     return confParser
         .booleanConf()
spark/v3.5/spark/src/main/java/org/apache/iceberg/spark/SparkSQLProperties.java

Lines changed: 4 additions & 0 deletions
@@ -101,4 +101,8 @@ private SparkSQLProperties() {}
   // Controls whether to report available column statistics to Spark for query optimization.
   public static final String REPORT_COLUMN_STATS = "spark.sql.iceberg.report-column-stats";
   public static final boolean REPORT_COLUMN_STATS_DEFAULT = true;
+
+  // Controls whether to push down limit to Iceberg scan planning
+  public static final String LIMIT_PUSH_DOWN_ENABLED = "spark.sql.iceberg.limit-push-down.enabled";
+  public static final boolean LIMIT_PUSH_DOWN_ENABLED_DEFAULT = true;
 }
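
Because the flag is read per session through SparkReadConf#limitPushDownEnabled() above, it can be toggled at runtime without restarting the application; the benchmark earlier in this commit flips it the same way. A small sketch, assuming spark is an existing SparkSession configured with an Iceberg catalog.

// Disable limit push down for this session (e.g. to compare query plans), then restore the default.
spark.conf().set("spark.sql.iceberg.limit-push-down.enabled", "false");
spark.conf().set("spark.sql.iceberg.limit-push-down.enabled", "true");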

spark/v3.5/spark/src/main/java/org/apache/iceberg/spark/source/SparkBatchQueryScan.java

Lines changed: 3 additions & 2 deletions
@@ -81,8 +81,9 @@ class SparkBatchQueryScan extends SparkPartitioningAwareScan<PartitionScanTask>
       SparkReadConf readConf,
       Schema expectedSchema,
       List<Expression> filters,
-      Supplier<ScanReport> scanReportSupplier) {
-    super(spark, table, scan, readConf, expectedSchema, filters, scanReportSupplier);
+      Supplier<ScanReport> scanReportSupplier,
+      int pushedLimit) {
+    super(spark, table, scan, readConf, expectedSchema, filters, scanReportSupplier, pushedLimit);
 
     this.snapshotId = readConf.snapshotId();
     this.startSnapshotId = readConf.startSnapshotId();
