
Commit 9f0fbf5

[lake/iceberg] Iceberg read implementation supports filter push down (apache#1715)
1 parent a8cef41 commit 9f0fbf5

14 files changed, +853 −155 lines

fluss-lake/fluss-lake-iceberg/src/main/java/org/apache/fluss/lake/iceberg/source/FlussRowAsIcebergRecord.java

Lines changed: 182 additions & 0 deletions
@@ -0,0 +1,182 @@
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.fluss.lake.iceberg.source;

import org.apache.fluss.row.InternalRow;
import org.apache.fluss.types.BigIntType;
import org.apache.fluss.types.BinaryType;
import org.apache.fluss.types.BooleanType;
import org.apache.fluss.types.BytesType;
import org.apache.fluss.types.CharType;
import org.apache.fluss.types.DataType;
import org.apache.fluss.types.DateType;
import org.apache.fluss.types.DecimalType;
import org.apache.fluss.types.DoubleType;
import org.apache.fluss.types.FloatType;
import org.apache.fluss.types.IntType;
import org.apache.fluss.types.LocalZonedTimestampType;
import org.apache.fluss.types.RowType;
import org.apache.fluss.types.SmallIntType;
import org.apache.fluss.types.StringType;
import org.apache.fluss.types.TimeType;
import org.apache.fluss.types.TimestampType;
import org.apache.fluss.types.TinyIntType;
import org.apache.fluss.utils.DateTimeUtils;

import org.apache.iceberg.data.Record;
import org.apache.iceberg.types.Types;

import java.nio.ByteBuffer;
import java.time.Instant;
import java.time.OffsetDateTime;
import java.time.ZoneOffset;
import java.util.Map;

/** Wrap Fluss {@link InternalRow} as Iceberg {@link Record}. */
public class FlussRowAsIcebergRecord implements Record {

    protected InternalRow internalRow;
    protected final Types.StructType structType;
    protected final RowType flussRowType;
    private final FlussRowToIcebergFieldConverter[] fieldConverters;

    public FlussRowAsIcebergRecord(Types.StructType structType, RowType flussRowType) {
        this.structType = structType;
        this.flussRowType = flussRowType;
        fieldConverters = new FlussRowToIcebergFieldConverter[flussRowType.getFieldCount()];
        for (int pos = 0; pos < flussRowType.getFieldCount(); pos++) {
            DataType flussType = flussRowType.getTypeAt(pos);
            fieldConverters[pos] = createTypeConverter(flussType, pos);
        }
    }

    public FlussRowAsIcebergRecord(
            Types.StructType structType, RowType flussRowType, InternalRow internalRow) {
        this(structType, flussRowType);
        this.internalRow = internalRow;
    }

    @Override
    public Types.StructType struct() {
        return structType;
    }

    @Override
    public Object getField(String name) {
        return get(structType.fields().indexOf(structType.field(name)));
    }

    @Override
    public void setField(String name, Object value) {
        throw new UnsupportedOperationException("method setField is not supported.");
    }

    @Override
    public Object get(int pos) {
        // handle normal columns
        if (internalRow.isNullAt(pos)) {
            return null;
        }
        return fieldConverters[pos].convert(internalRow);
    }

    @Override
    public Record copy() {
        throw new UnsupportedOperationException("method copy is not supported.");
    }

    @Override
    public Record copy(Map<String, Object> overwriteValues) {
        throw new UnsupportedOperationException("method copy is not supported.");
    }

    @Override
    public int size() {
        return structType.fields().size();
    }

    @Override
    public <T> T get(int pos, Class<T> javaClass) {
        Object value = get(pos);
        if (value == null || javaClass.isInstance(value)) {
            return javaClass.cast(value);
        } else {
            throw new IllegalStateException(
                    "Not an instance of " + javaClass.getName() + ": " + value);
        }
    }

    @Override
    public <T> void set(int pos, T value) {
        throw new UnsupportedOperationException("method set is not supported.");
    }

    private interface FlussRowToIcebergFieldConverter {
        Object convert(InternalRow value);
    }

    private FlussRowToIcebergFieldConverter createTypeConverter(DataType flussType, int pos) {
        if (flussType instanceof BooleanType) {
            return row -> row.getBoolean(pos);
        } else if (flussType instanceof TinyIntType) {
            return row -> (int) row.getByte(pos);
        } else if (flussType instanceof SmallIntType) {
            return row -> (int) row.getShort(pos);
        } else if (flussType instanceof IntType) {
            return row -> row.getInt(pos);
        } else if (flussType instanceof BigIntType) {
            return row -> row.getLong(pos);
        } else if (flussType instanceof FloatType) {
            return row -> row.getFloat(pos);
        } else if (flussType instanceof DoubleType) {
            return row -> row.getDouble(pos);
        } else if (flussType instanceof StringType) {
            return row -> row.getString(pos).toString();
        } else if (flussType instanceof CharType) {
            CharType charType = (CharType) flussType;
            return row -> row.getChar(pos, charType.getLength()).toString();
        } else if (flussType instanceof BytesType || flussType instanceof BinaryType) {
            return row -> ByteBuffer.wrap(row.getBytes(pos));
        } else if (flussType instanceof DecimalType) {
            DecimalType decimalType = (DecimalType) flussType;
            return row ->
                    row.getDecimal(pos, decimalType.getPrecision(), decimalType.getScale())
                            .toBigDecimal();
        } else if (flussType instanceof LocalZonedTimestampType) {
            LocalZonedTimestampType ltzType = (LocalZonedTimestampType) flussType;
            return row ->
                    toIcebergTimestampLtz(
                            row.getTimestampLtz(pos, ltzType.getPrecision()).toInstant());
        } else if (flussType instanceof TimestampType) {
            TimestampType tsType = (TimestampType) flussType;
            return row -> row.getTimestampNtz(pos, tsType.getPrecision()).toLocalDateTime();
        } else if (flussType instanceof DateType) {
            return row -> DateTimeUtils.toLocalDate(row.getInt(pos));
        } else if (flussType instanceof TimeType) {
            return row -> DateTimeUtils.toLocalTime(row.getInt(pos));
        } else {
            throw new UnsupportedOperationException(
                    "Unsupported data type conversion for Fluss type: "
                            + flussType.getClass().getSimpleName());
        }
    }

    private OffsetDateTime toIcebergTimestampLtz(Instant instant) {
        return OffsetDateTime.ofInstant(instant, ZoneOffset.UTC);
    }
}
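
The design choice worth noting above: type dispatch happens once per schema rather than once per field access. The constructor walks each Fluss DataType a single time and caches a converter lambda per column position, so get(pos) reduces to a null check plus an array lookup. The widenings are forced by Iceberg's type system, which has no byte or short types (hence TinyIntType and SmallIntType both map to Java int) and whose generic records represent TIMESTAMP WITH LOCAL TIME ZONE as an OffsetDateTime pinned to UTC. A minimal standalone sketch of the same build-once dispatch pattern, using plain Java types instead of the Fluss API (FieldConverter, the schema, and the row layout here are illustrative, not from the commit):

import java.util.List;
import java.util.function.Function;

public class ConverterArraySketch {

    // One converter per column position, built once from the schema.
    interface FieldConverter extends Function<Object[], Object> {}

    static FieldConverter createConverter(Class<?> type, int pos) {
        if (type == Short.class) {
            // Widen small integers, mirroring TinyInt/SmallInt -> Iceberg int.
            return row -> ((Short) row[pos]).intValue();
        } else if (type == String.class) {
            return row -> (String) row[pos];
        }
        throw new UnsupportedOperationException("Unsupported type: " + type.getSimpleName());
    }

    public static void main(String[] args) {
        List<Class<?>> schema = List.of(Short.class, String.class);
        FieldConverter[] converters = new FieldConverter[schema.size()];
        for (int pos = 0; pos < schema.size(); pos++) {
            converters[pos] = createConverter(schema.get(pos), pos);
        }
        Object[] row = {(short) 7, "hello"};
        System.out.println(converters[0].apply(row)); // 7, now an Integer
        System.out.println(converters[1].apply(row)); // hello
    }
}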

fluss-lake/fluss-lake-iceberg/src/main/java/org/apache/fluss/lake/iceberg/source/IcebergLakeSource.java

Lines changed: 31 additions & 4 deletions
@@ -19,6 +19,7 @@
 package org.apache.fluss.lake.iceberg.source;

 import org.apache.fluss.config.Configuration;
+import org.apache.fluss.lake.iceberg.utils.FlussToIcebergPredicateConverter;
 import org.apache.fluss.lake.iceberg.utils.IcebergCatalogUtils;
 import org.apache.fluss.lake.serializer.SimpleVersionedSerializer;
 import org.apache.fluss.lake.source.LakeSource;
@@ -27,14 +28,18 @@
 import org.apache.fluss.metadata.TablePath;
 import org.apache.fluss.predicate.Predicate;

+import org.apache.iceberg.Schema;
 import org.apache.iceberg.Table;
 import org.apache.iceberg.catalog.Catalog;
+import org.apache.iceberg.expressions.Expression;
+import org.apache.iceberg.expressions.Expressions;

 import javax.annotation.Nullable;

 import java.io.IOException;
-import java.util.Collections;
+import java.util.ArrayList;
 import java.util.List;
+import java.util.Optional;

 import static org.apache.fluss.lake.iceberg.utils.IcebergConversions.toIceberg;

@@ -44,6 +49,7 @@ public class IcebergLakeSource implements LakeSource<IcebergSplit> {
     private final Configuration icebergConfig;
     private final TablePath tablePath;
     private @Nullable int[][] project;
+    private @Nullable Expression filter;

     public IcebergLakeSource(Configuration icebergConfig, TablePath tablePath) {
         this.icebergConfig = icebergConfig;
@@ -62,13 +68,29 @@ public void withLimit(int limit) {

     @Override
     public FilterPushDownResult withFilters(List<Predicate> predicates) {
-        // TODO: Support filter push down. #1676
-        return FilterPushDownResult.of(Collections.emptyList(), predicates);
+        List<Predicate> unConsumedPredicates = new ArrayList<>();
+        List<Predicate> consumedPredicates = new ArrayList<>();
+        List<Expression> converted = new ArrayList<>();
+        Schema schema = getSchema(tablePath);
+        for (Predicate predicate : predicates) {
+            Optional<Expression> optPredicate =
+                    FlussToIcebergPredicateConverter.convert(schema, predicate);
+            if (optPredicate.isPresent()) {
+                consumedPredicates.add(predicate);
+                converted.add(optPredicate.get());
+            } else {
+                unConsumedPredicates.add(predicate);
+            }
+        }
+        if (!converted.isEmpty()) {
+            filter = converted.stream().reduce(Expressions::and).orElse(null);
+        }
+        return FilterPushDownResult.of(consumedPredicates, unConsumedPredicates);
     }

     @Override
     public Planner<IcebergSplit> createPlanner(PlannerContext context) throws IOException {
-        return new IcebergSplitPlanner(icebergConfig, tablePath, context.snapshotId());
+        return new IcebergSplitPlanner(icebergConfig, tablePath, context.snapshotId(), filter);
     }

     @Override
@@ -82,4 +104,9 @@ public RecordReader createRecordReader(ReaderContext<IcebergSplit> context) thro
     public SimpleVersionedSerializer<IcebergSplit> getSplitSerializer() {
         return new IcebergSplitSerializer();
     }
+
+    private Schema getSchema(TablePath tablePath) {
+        Catalog catalog = IcebergCatalogUtils.createIcebergCatalog(icebergConfig);
+        return catalog.loadTable(toIceberg(tablePath)).schema();
+    }
 }
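
The rewritten withFilters partitions the incoming Fluss predicates into those FlussToIcebergPredicateConverter can translate (consumed, evaluated by Iceberg at scan time) and the rest (unconsumed, left for Fluss to evaluate), then folds all translated expressions into a single conjunction with Expressions::and. A small illustration of that reduction using Iceberg's expressions API directly (the column names are made up for the example):

import java.util.Arrays;
import java.util.List;

import org.apache.iceberg.expressions.Expression;
import org.apache.iceberg.expressions.Expressions;

public class AndReductionSketch {
    public static void main(String[] args) {
        // Two already-converted predicates, e.g. id = 42 AND amount > 100.
        List<Expression> converted =
                Arrays.asList(
                        Expressions.equal("id", 42L),
                        Expressions.greaterThan("amount", 100L));
        // Same fold as withFilters; an empty list would leave the filter null.
        Expression combined = converted.stream().reduce(Expressions::and).orElse(null);
        System.out.println(combined); // prints the combined AND expression
    }
}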

fluss-lake/fluss-lake-iceberg/src/main/java/org/apache/fluss/lake/iceberg/source/IcebergRecordReader.java

Lines changed: 7 additions & 1 deletion
@@ -45,7 +45,13 @@
 import static org.apache.fluss.metadata.TableDescriptor.OFFSET_COLUMN_NAME;
 import static org.apache.fluss.metadata.TableDescriptor.TIMESTAMP_COLUMN_NAME;

-/** Iceberg record reader. */
+/**
+ * Iceberg record reader. The filter is applied during the plan phase of IcebergSplitPlanner, so the
+ * RecordReader does not need to apply the filter again.
+ *
+ * <p>Refer to {@link org.apache.iceberg.data.GenericReader#open(FileScanTask)} and {@link
+ * org.apache.iceberg.Scan#ignoreResiduals()} for details.
+ */
 public class IcebergRecordReader implements RecordReader {
     protected IcebergRecordAsFlussRecordIterator iterator;
     protected @Nullable int[][] project;
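
The new Javadoc points at a real subtlety: a plan-time filter prunes whole files using file-level stats, but individual rows in a surviving file can still fail the predicate. Iceberg carries that leftover per task as FileScanTask#residual(), and because this commit drops ignoreResiduals() from the scan, Iceberg's GenericReader evaluates the residual while reading, which is why this reader need not filter again. A hedged sketch of how code could check whether a task still needs row-level filtering (illustrative, not from the commit):

import org.apache.iceberg.FileScanTask;
import org.apache.iceberg.expressions.Expression;

public class ResidualCheckSketch {
    // True when the task's residual expression still requires per-row evaluation;
    // residual() reports alwaysTrue() when the scan used ignoreResiduals().
    static boolean needsRowFilter(FileScanTask task) {
        Expression residual = task.residual();
        return residual.op() != Expression.Operation.TRUE;
    }
}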

fluss-lake/fluss-lake-iceberg/src/main/java/org/apache/fluss/lake/iceberg/source/IcebergSplitPlanner.java

Lines changed: 13 additions & 7 deletions
@@ -27,9 +27,13 @@
 import org.apache.iceberg.PartitionField;
 import org.apache.iceberg.PartitionSpec;
 import org.apache.iceberg.Table;
+import org.apache.iceberg.TableScan;
 import org.apache.iceberg.catalog.Catalog;
+import org.apache.iceberg.expressions.Expression;
 import org.apache.iceberg.io.CloseableIterable;

+import javax.annotation.Nullable;
+
 import java.io.IOException;
 import java.util.ArrayList;
 import java.util.Collections;
@@ -47,11 +51,14 @@ public class IcebergSplitPlanner implements Planner<IcebergSplit> {
     private final Configuration icebergConfig;
     private final TablePath tablePath;
     private final long snapshotId;
+    private final @Nullable Expression filter;

-    public IcebergSplitPlanner(Configuration icebergConfig, TablePath tablePath, long snapshotId) {
+    public IcebergSplitPlanner(
+            Configuration icebergConfig, TablePath tablePath, long snapshotId, Expression filter) {
         this.icebergConfig = icebergConfig;
         this.tablePath = tablePath;
         this.snapshotId = snapshotId;
+        this.filter = filter;
     }

     @Override
@@ -61,12 +68,11 @@ public List<IcebergSplit> plan() throws IOException {
         Table table = catalog.loadTable(toIceberg(tablePath));
         Function<FileScanTask, List<String>> partitionExtract = createPartitionExtractor(table);
         Function<FileScanTask, Integer> bucketExtractor = createBucketExtractor(table);
-        try (CloseableIterable<FileScanTask> tasks =
-                table.newScan()
-                        .useSnapshot(snapshotId)
-                        .includeColumnStats()
-                        .ignoreResiduals()
-                        .planFiles()) {
+        TableScan tableScan = table.newScan().useSnapshot(snapshotId).includeColumnStats();
+        if (filter != null) {
+            tableScan = tableScan.filter(filter);
+        }
+        try (CloseableIterable<FileScanTask> tasks = tableScan.planFiles()) {
             tasks.forEach(
                     task ->
                             splits.add(
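
With the new constructor parameter, the conjunction built in IcebergLakeSource.withFilters reaches the TableScan before planFiles() runs, so pruning happens against per-file min/max stats during planning. A hedged usage sketch of driving the planner under a range filter (the order_id column and the helper method are hypothetical; IcebergSplit is assumed to be in the same package):

import java.io.IOException;
import java.util.List;

import org.apache.fluss.config.Configuration;
import org.apache.fluss.metadata.TablePath;

import org.apache.iceberg.expressions.Expression;
import org.apache.iceberg.expressions.Expressions;

public class PlannerUsageSketch {
    // Hypothetical driver, not part of the commit: plan splits under a
    // conjunctive filter so files whose stats exclude the range are skipped.
    static List<IcebergSplit> planFiltered(
            Configuration icebergConfig, TablePath tablePath, long snapshotId)
            throws IOException {
        Expression filter =
                Expressions.and(
                        Expressions.greaterThanOrEqual("order_id", 100L),
                        Expressions.lessThan("order_id", 200L));
        return new IcebergSplitPlanner(icebergConfig, tablePath, snapshotId, filter).plan();
    }
}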

0 commit comments

Comments
 (0)