Commit 0b06463
Row level filtering: Allow table scans to pass a row level filter for ORC files
1 parent 9298ca2 commit 0b06463

11 files changed: +572 -28 lines changed
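
The diffs below add an OrcRowFilter hook to the ORC read path: a filter declares the columns it needs (by Iceberg field id) and is consulted once per row. As a sketch of that contract, here is a filter in the style of the new tests that keeps only rows whose id is at least 75 (the variable name is illustrative):

// A row filter over the "id" column. requiredSchema() declares the
// columns the filter needs; shouldKeep(...) receives those columns'
// values in the same order, one row at a time.
OrcRowFilter keepLargeIds = new OrcRowFilter() {
  @Override
  public Schema requiredSchema() {
    return new Schema(Types.NestedField.required(100, "id", Types.LongType.get()));
  }

  @Override
  public boolean shouldKeep(Object[] values) {
    return (Long) values[0] >= 75;
  }
};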

core/src/main/java/org/apache/iceberg/BaseFileScanTask.java

Lines changed: 5 additions & 1 deletion
@@ -169,7 +169,7 @@ public FileScanTask next() {
     }
   }

-  private static final class SplitScanTask implements FileScanTask {
+  public static final class SplitScanTask implements FileScanTask {
     private final long len;
     private final long offset;
     private final FileScanTask fileScanTask;
@@ -209,5 +209,9 @@ public Expression residual() {
     public Iterable<FileScanTask> split(long splitSize) {
       throw new UnsupportedOperationException("Cannot split a task which is already split");
     }
+
+    public FileScanTask underlyingFileScanTask() {
+      return fileScanTask;
+    }
   }
 }
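
SplitScanTask also becomes public and exposes the task it wraps, so callers that receive split tasks from scan planning can recover the original file-level task. A hypothetical caller-side sketch (task is any FileScanTask produced by a scan):

// Unwrap a split back to its file-level task when present.
FileScanTask fileTask = (task instanceof BaseFileScanTask.SplitScanTask)
    ? ((BaseFileScanTask.SplitScanTask) task).underlyingFileScanTask()
    : task;
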
data/src/test/java/org/apache/iceberg/data/orc/TestOrcRowLevelFiltering.java (new file)

Lines changed: 183 additions & 0 deletions

@@ -0,0 +1,183 @@
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.apache.iceberg.data.orc;

import java.io.File;
import java.io.IOException;
import java.util.List;
import java.util.stream.Collectors;
import java.util.stream.LongStream;
import org.apache.iceberg.Files;
import org.apache.iceberg.Schema;
import org.apache.iceberg.data.DataTestHelpers;
import org.apache.iceberg.data.GenericRecord;
import org.apache.iceberg.data.Record;
import org.apache.iceberg.io.CloseableIterable;
import org.apache.iceberg.io.FileAppender;
import org.apache.iceberg.orc.ORC;
import org.apache.iceberg.orc.OrcRowFilter;
import org.apache.iceberg.relocated.com.google.common.collect.ImmutableList;
import org.apache.iceberg.relocated.com.google.common.collect.Lists;
import org.apache.iceberg.types.Types;
import org.junit.Assert;
import org.junit.Rule;
import org.junit.Test;
import org.junit.rules.TemporaryFolder;

import static org.apache.iceberg.types.Types.NestedField.optional;
import static org.apache.iceberg.types.Types.NestedField.required;

public class TestOrcRowLevelFiltering {

  @Rule
  public TemporaryFolder temp = new TemporaryFolder();

  private static final Schema SCHEMA = new Schema(
      required(100, "id", Types.LongType.get()),
      required(101, "data1", Types.StringType.get()),
      required(102, "data2", Types.StringType.get())
  );

  private static final List<Record> RECORDS = LongStream.range(0, 100).mapToObj(i -> {
    Record record = GenericRecord.create(SCHEMA);
    record.set(0, i);
    record.set(1, "data1:" + i);
    record.set(2, "data2:" + i);
    return record;
  }).collect(Collectors.toList());

  @Test
  public void testReadOrcWithRowFilterNoProjection() throws IOException {
    testReadOrcWithRowFilter(SCHEMA, rowFilterId(), RECORDS.subList(75, 100));
  }

  @Test
  public void testReadOrcWithRowFilterProjection() throws IOException {
    Schema projectedSchema = new Schema(
        required(101, "data1", Types.StringType.get())
    );

    List<Record> expected = RECORDS.subList(75, 100).stream().map(r -> {
      Record record = GenericRecord.create(projectedSchema);
      record.set(0, r.get(1));
      return record;
    }).collect(Collectors.toList());

    testReadOrcWithRowFilter(projectedSchema, rowFilterId(), expected);
  }

  @Test
  public void testReadOrcWithRowFilterPartialFilterColumns() throws IOException {
    Schema projectedSchema = new Schema(
        required(101, "data1", Types.StringType.get()),
        required(102, "data2", Types.StringType.get())
    );

    List<Record> expected = RECORDS.subList(25, 75).stream().map(r -> {
      Record record = GenericRecord.create(projectedSchema);
      record.set(0, r.get(1));
      record.set(1, r.get(2));
      return record;
    }).collect(Collectors.toList());

    testReadOrcWithRowFilter(projectedSchema, rowFilterIdAndData1(), expected);
  }

  @Test
  public void testReadOrcWithRowFilterNonExistentColumn() throws IOException {
    testReadOrcWithRowFilter(SCHEMA, rowFilterData3(), ImmutableList.of());
  }

  private void testReadOrcWithRowFilter(Schema schema, OrcRowFilter rowFilter, List<Record> expected)
      throws IOException {
    File testFile = temp.newFile();
    Assert.assertTrue("Delete should succeed", testFile.delete());

    try (FileAppender<Record> writer = ORC.write(Files.localOutput(testFile))
        .schema(SCHEMA)
        .createWriterFunc(GenericOrcWriter::buildWriter)
        .build()) {
      for (Record rec : RECORDS) {
        writer.add(rec);
      }
    }

    List<Record> rows;
    try (CloseableIterable<Record> reader = ORC.read(Files.localInput(testFile))
        .project(schema)
        .createReaderFunc(fileSchema -> GenericOrcReader.buildReader(schema, fileSchema))
        .rowFilter(rowFilter)
        .build()) {
      rows = Lists.newArrayList(reader);
    }

    for (int i = 0; i < expected.size(); i += 1) {
      DataTestHelpers.assertEquals(schema.asStruct(), expected.get(i), rows.get(i));
    }
  }

  private OrcRowFilter rowFilterId() {
    return new OrcRowFilter() {
      @Override
      public Schema requiredSchema() {
        return new Schema(
            required(100, "id", Types.LongType.get())
        );
      }

      @Override
      public boolean shouldKeep(Object[] values) {
        return (Long) values[0] >= 75;
      }
    };
  }

  private OrcRowFilter rowFilterIdAndData1() {
    return new OrcRowFilter() {
      @Override
      public Schema requiredSchema() {
        return new Schema(
            SCHEMA.findField("id"),
            SCHEMA.findField("data1")
        );
      }

      @Override
      public boolean shouldKeep(Object[] values) {
        return (Long) values[0] >= 25 && ((String) values[1]).compareTo("data1:75") < 0;
      }
    };
  }

  private OrcRowFilter rowFilterData3() {
    return new OrcRowFilter() {
      @Override
      public Schema requiredSchema() {
        return new Schema(
            optional(104, "data3", Types.LongType.get())
        );
      }

      @Override
      public boolean shouldKeep(Object[] values) {
        return values[0] != null && (Long) values[0] >= 25;
      }
    };
  }
}

orc/src/main/java/org/apache/iceberg/orc/ORC.java

Lines changed: 7 additions & 1 deletion
@@ -126,6 +126,7 @@ public static class ReadBuilder {
     private Long length = null;
     private Expression filter = null;
     private boolean caseSensitive = true;
+    private OrcRowFilter rowFilter = null;

     private Function<TypeDescription, OrcRowReader<?>> readerFunc;
     private Function<TypeDescription, OrcBatchReader<?>> batchedReaderFunc;
@@ -194,10 +195,15 @@ public ReadBuilder recordsPerBatch(int numRecordsPerBatch) {
       return this;
     }

+    public ReadBuilder rowFilter(OrcRowFilter newRowFilter) {
+      this.rowFilter = newRowFilter;
+      return this;
+    }
+
     public <D> CloseableIterable<D> build() {
       Preconditions.checkNotNull(schema, "Schema is required");
       return new OrcIterable<>(file, conf, schema, start, length, readerFunc, caseSensitive, filter, batchedReaderFunc,
-          recordsPerBatch);
+          recordsPerBatch, rowFilter);
     }
   }

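With the builder hook in place, enabling row-level filtering is one extra call on the read path. A minimal read sketch, assuming the Generic ORC reader used in the tests above and the keepLargeIds filter sketched earlier (orcFile and readSchema are placeholders):

try (CloseableIterable<Record> reader = ORC.read(Files.localInput(orcFile))
    .project(readSchema)
    .createReaderFunc(fileSchema -> GenericOrcReader.buildReader(readSchema, fileSchema))
    .rowFilter(keepLargeIds)   // rows failing shouldKeep() are skipped
    .build()) {
  for (Record record : reader) {
    // only rows with id >= 75 reach this point
  }
}
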
orc/src/main/java/org/apache/iceberg/orc/OrcIterable.java

Lines changed: 85 additions & 24 deletions
@@ -20,6 +20,7 @@
 package org.apache.iceberg.orc;

 import java.io.IOException;
+import java.util.Set;
 import java.util.function.Function;
 import org.apache.hadoop.conf.Configuration;
 import org.apache.iceberg.Schema;
@@ -31,6 +32,9 @@
 import org.apache.iceberg.io.CloseableIterable;
 import org.apache.iceberg.io.CloseableIterator;
 import org.apache.iceberg.io.InputFile;
+import org.apache.iceberg.relocated.com.google.common.base.Preconditions;
+import org.apache.iceberg.relocated.com.google.common.collect.Sets;
+import org.apache.iceberg.types.TypeUtil;
 import org.apache.iceberg.util.Pair;
 import org.apache.orc.Reader;
 import org.apache.orc.TypeDescription;
@@ -51,11 +55,13 @@ class OrcIterable<T> extends CloseableGroup implements CloseableIterable<T> {
   private final boolean caseSensitive;
   private final Function<TypeDescription, OrcBatchReader<?>> batchReaderFunction;
   private final int recordsPerBatch;
+  private final OrcRowFilter rowFilter;

   OrcIterable(InputFile file, Configuration config, Schema schema,
               Long start, Long length,
               Function<TypeDescription, OrcRowReader<?>> readerFunction, boolean caseSensitive, Expression filter,
-              Function<TypeDescription, OrcBatchReader<?>> batchReaderFunction, int recordsPerBatch) {
+              Function<TypeDescription, OrcBatchReader<?>> batchReaderFunction, int recordsPerBatch,
+              OrcRowFilter rowFilter) {
     this.schema = schema;
     this.readerFunction = readerFunction;
     this.file = file;
@@ -66,6 +72,7 @@ class OrcIterable<T> extends CloseableGroup implements CloseableIterable<T> {
     this.filter = (filter == Expressions.alwaysTrue()) ? null : filter;
     this.batchReaderFunction = batchReaderFunction;
     this.recordsPerBatch = recordsPerBatch;
+    this.rowFilter = rowFilter;
   }

   @SuppressWarnings("unchecked")
@@ -81,16 +88,37 @@ public CloseableIterator<T> iterator() {
       sarg = ExpressionToSearchArgument.convert(boundFilter, readOrcSchema);
     }

-    VectorizedRowBatchIterator rowBatchIterator = newOrcIterator(file, readOrcSchema, start, length, orcFileReader,
-        sarg, recordsPerBatch);
-    if (batchReaderFunction != null) {
-      OrcBatchReader<T> batchReader = (OrcBatchReader<T>) batchReaderFunction.apply(readOrcSchema);
-      return CloseableIterator.transform(rowBatchIterator, pair -> {
-        batchReader.setBatchContext(pair.second());
-        return batchReader.read(pair.first());
-      });
+    if (rowFilter == null) {
+      VectorizedRowBatchIterator rowBatchIterator = newOrcIterator(file, readOrcSchema, start, length, orcFileReader,
+          sarg, recordsPerBatch);
+      if (batchReaderFunction != null) {
+        OrcBatchReader<T> batchReader = (OrcBatchReader<T>) batchReaderFunction.apply(readOrcSchema);
+        return CloseableIterator.transform(rowBatchIterator, pair -> {
+          batchReader.setBatchContext(pair.second());
+          return batchReader.read(pair.first());
+        });
+      } else {
+        return new OrcRowIterator<>(rowBatchIterator, (OrcRowReader<T>) readerFunction.apply(readOrcSchema),
+            null, null);
+      }
     } else {
-      return new OrcRowIterator<>(rowBatchIterator, (OrcRowReader<T>) readerFunction.apply(readOrcSchema));
+      Preconditions.checkArgument(batchReaderFunction == null,
+          "Row-level filtering not supported by vectorized reader");
+      Set<Integer> filterColumnIds = TypeUtil.getProjectedIds(rowFilter.requiredSchema());
+      Set<Integer> filterColumnIdsNotInReadSchema = Sets.difference(filterColumnIds,
+          TypeUtil.getProjectedIds(schema));
+      Schema extraFilterColumns = TypeUtil.select(rowFilter.requiredSchema(), filterColumnIdsNotInReadSchema);
+      Schema finalReadSchema = TypeUtil.join(schema, extraFilterColumns);
+
+      TypeDescription finalReadOrcSchema = ORCSchemaUtil.buildOrcProjection(finalReadSchema,
+          orcFileReader.getSchema());
+      TypeDescription rowFilterOrcSchema = ORCSchemaUtil.buildOrcProjection(rowFilter.requiredSchema(),
+          orcFileReader.getSchema());
+      RowFilterValueReader filterReader = new RowFilterValueReader(finalReadOrcSchema, rowFilterOrcSchema);
+
+      return new OrcRowIterator<>(
+          newOrcIterator(file, finalReadOrcSchema, start, length, orcFileReader, sarg, recordsPerBatch),
+          (OrcRowReader<T>) readerFunction.apply(readOrcSchema), rowFilter, filterReader);
     }
   }

@@ -116,34 +144,67 @@ private static VectorizedRowBatchIterator newOrcIterator(InputFile file,

   private static class OrcRowIterator<T> implements CloseableIterator<T> {

-    private int nextRow;
-    private VectorizedRowBatch current;
+    private int currentRow;
+    private VectorizedRowBatch currentBatch;
+    private boolean advanced = false;

     private final VectorizedRowBatchIterator batchIter;
     private final OrcRowReader<T> reader;
+    private final OrcRowFilter filter;
+    private final RowFilterValueReader filterReader;

-    OrcRowIterator(VectorizedRowBatchIterator batchIter, OrcRowReader<T> reader) {
+    OrcRowIterator(VectorizedRowBatchIterator batchIter, OrcRowReader<T> reader, OrcRowFilter filter,
+                   RowFilterValueReader filterReader) {
       this.batchIter = batchIter;
       this.reader = reader;
-      current = null;
-      nextRow = 0;
+      this.filter = filter;
+      this.filterReader = filterReader;
+      currentBatch = null;
+      currentRow = 0;
+    }
+
+    private void advance() {
+      if (!advanced) {
+        while (true) {
+          currentRow++;
+          // if batch has been consumed, move to next batch
+          if (currentBatch == null || currentRow >= currentBatch.size) {
+            if (batchIter.hasNext()) {
+              Pair<VectorizedRowBatch, Long> nextBatch = batchIter.next();
+              currentBatch = nextBatch.first();
+              currentRow = 0;
+              reader.setBatchContext(nextBatch.second());
+              if (filterReader != null) {
+                filterReader.setBatchContext(nextBatch.second());
+              }
+            } else {
+              // no more batches left to process
+              currentBatch = null;
+              currentRow = -1;
+              break;
+            }
+          }
+          if (filter == null || filter.shouldKeep(filterReader.read(currentBatch, currentRow))) {
+            // we have found our row
+            break;
+          }
+        }
+        advanced = true;
+      }
     }

     @Override
     public boolean hasNext() {
-      return (current != null && nextRow < current.size) || batchIter.hasNext();
+      advance();
+      return currentBatch != null;
     }

     @Override
     public T next() {
-      if (current == null || nextRow >= current.size) {
-        Pair<VectorizedRowBatch, Long> nextBatch = batchIter.next();
-        current = nextBatch.first();
-        nextRow = 0;
-        this.reader.setBatchContext(nextBatch.second());
-      }
-
-      return this.reader.read(current, nextRow++);
+      advance();
+      // mark current row as used
+      advanced = false;
+      return this.reader.read(currentBatch, currentRow);
     }

     @Override

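Two details of this iterator are worth noting. Row filters are rejected when a vectorized batch reader is configured, and the filter's required columns are joined into the read schema (TypeUtil.join) so they are decoded for filtering even when the projection omits them. That is why a read like the following sketch works, echoing testReadOrcWithRowFilterProjection above and reusing the keepLargeIds filter sketched earlier: the filter sees "id" while callers receive only "data1".

Schema projected = new Schema(required(101, "data1", Types.StringType.get()));

List<Record> rows;
try (CloseableIterable<Record> reader = ORC.read(Files.localInput(testFile))
    .project(projected)
    .createReaderFunc(fileSchema -> GenericOrcReader.buildReader(projected, fileSchema))
    .rowFilter(keepLargeIds)   // filters on "id", which is not in the projection
    .build()) {
  rows = Lists.newArrayList(reader);  // records 75..99, each holding only "data1"
}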