
Commit 2582ab9

fix comments
1 parent 3b34734 commit 2582ab9

5 files changed (+44 additions, −51 deletions)


fluss-lake/fluss-lake-iceberg/src/main/java/com/alibaba/fluss/lake/iceberg/tiering/IcebergLakeCommitter.java

Lines changed: 14 additions & 23 deletions
@@ -31,6 +31,7 @@
 import org.apache.iceberg.DeleteFile;
 import org.apache.iceberg.RowDelta;
 import org.apache.iceberg.Snapshot;
+import org.apache.iceberg.SnapshotUpdate;
 import org.apache.iceberg.Table;
 import org.apache.iceberg.catalog.Catalog;
 import org.apache.iceberg.catalog.TableIdentifier;
@@ -102,31 +103,21 @@ public long commit(IcebergCommittable committable, Map<String, String> snapshotP
             for (DataFile dataFile : committable.getDataFiles()) {
                 appendFiles.appendFile(dataFile);
             }
-            if (!committable.getDeleteFiles().isEmpty()) {
-                throw new IllegalStateException(
-                        "Delete files are not supported in append-only mode. "
-                                + "Found "
-                                + committable.getDeleteFiles().size()
-                                + " delete files.");
-            }
 
             addFlussProperties(appendFiles, snapshotProperties);
 
             appendFiles.commit();
         } else {
-            // Row delta validations are not needed for streaming changes that write equality
-            // deletes.
-            // Equality deletes are applied to data in all previous sequence numbers, so retries
-            // may
-            // push deletes further in the future, but do not affect correctness. Position
-            // deletes
-            // committed to the table in this path are used only to delete rows from data files
-            // that are
-            // being added in this commit. There is no way for data files added along with the
-            // delete
-            // files to be concurrently removed, so there is no need to validate the files
-            // referenced by
-            // the position delete files that are being committed.
+            /**
+             * Row delta validations are not needed for streaming changes that write equality
+             * deletes. Equality deletes are applied to data in all previous sequence numbers,
+             * so retries may push deletes further in the future, but do not affect correctness.
+             * Position deletes committed to the table in this path are used only to delete rows
+             * from data files that are being added in this commit. There is no way for data
+             * files added along with the delete files to be concurrently removed, so there is
+             * no need to validate the files referenced by the position delete files that are
+             * being committed.
+             */
             RowDelta rowDelta = icebergTable.newRowDelta();
             Arrays.stream(committable.getDataFiles().stream().toArray(DataFile[]::new))
                     .forEach(rowDelta::addRows);
@@ -147,10 +138,10 @@ public long commit(IcebergCommittable committable, Map<String, String> snapshotP
     }
 
     private void addFlussProperties(
-            AppendFiles appendFiles, Map<String, String> snapshotProperties) {
-        appendFiles.set("commit-user", FLUSS_LAKE_TIERING_COMMIT_USER);
+            SnapshotUpdate<?> operation, Map<String, String> snapshotProperties) {
+        operation.set("commit-user", FLUSS_LAKE_TIERING_COMMIT_USER);
         for (Map.Entry<String, String> entry : snapshotProperties.entrySet()) {
-            appendFiles.set(entry.getKey(), entry.getValue());
+            operation.set(entry.getKey(), entry.getValue());
         }
     }
 
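The switch from AppendFiles to SnapshotUpdate<?> in addFlussProperties works because both AppendFiles (the append-only commit path) and RowDelta (the primary-key commit path) extend Iceberg's SnapshotUpdate, which exposes set(String, String) for snapshot summary properties. A minimal sketch of that idea outside the Fluss classes; the property values below are placeholders, not the project's constants:

    import java.util.Map;

    import org.apache.iceberg.AppendFiles;
    import org.apache.iceberg.RowDelta;
    import org.apache.iceberg.SnapshotUpdate;
    import org.apache.iceberg.Table;

    class SnapshotPropertiesSketch {

        // One helper serves both snapshot-producing operations.
        static void addProperties(SnapshotUpdate<?> operation, Map<String, String> props) {
            operation.set("commit-user", "fluss-lake-tiering"); // placeholder value
            for (Map.Entry<String, String> entry : props.entrySet()) {
                operation.set(entry.getKey(), entry.getValue());
            }
        }

        static void commitAppend(Table table, Map<String, String> props) {
            AppendFiles append = table.newAppend(); // AppendFiles extends SnapshotUpdate<AppendFiles>
            addProperties(append, props);
            append.commit();
        }

        static void commitRowDelta(Table table, Map<String, String> props) {
            RowDelta rowDelta = table.newRowDelta(); // RowDelta extends SnapshotUpdate<RowDelta>
            addProperties(rowDelta, props);
            rowDelta.commit();
        }
    }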

fluss-lake/fluss-lake-iceberg/src/main/java/com/alibaba/fluss/lake/iceberg/tiering/IcebergLakeWriter.java

Lines changed: 6 additions & 3 deletions
@@ -23,7 +23,6 @@
 import com.alibaba.fluss.lake.writer.WriterInitContext;
 import com.alibaba.fluss.metadata.TablePath;
 import com.alibaba.fluss.record.LogRecord;
-import com.alibaba.fluss.shaded.guava32.com.google.common.collect.Lists;
 
 import org.apache.iceberg.FileFormat;
 import org.apache.iceberg.PartitionSpec;
@@ -37,6 +36,7 @@
 
 import java.io.Closeable;
 import java.io.IOException;
+import java.util.ArrayList;
 import java.util.Collections;
 import java.util.List;
 
@@ -64,7 +64,7 @@ public IcebergLakeWriter(
 
     private RecordWriter createRecordWriter(WriterInitContext writerInitContext) {
         Schema schema = icebergTable.schema();
-        List<Integer> equalityFieldIds = Lists.newArrayList(schema.identifierFieldIds());
+        List<Integer> equalityFieldIds = new ArrayList<>(schema.identifierFieldIds());
         PartitionSpec spec = icebergTable.spec();
 
         // Get target file size from table properties
@@ -90,6 +90,8 @@ private RecordWriter createRecordWriter(WriterInitContext writerInitContext) {
                         format,
                         outputFileFactory,
                         targetFileSize);
+            } else {
+                return null;
             }
         } else {
             if (spec.isUnpartitioned()) {
@@ -102,9 +104,10 @@ private RecordWriter createRecordWriter(WriterInitContext writerInitContext) {
                         format,
                         outputFileFactory,
                         targetFileSize);
+            } else {
+                return null;
             }
         }
-        return null;
     }
 
     @Override
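In IcebergLakeWriter, the single trailing return null is replaced by explicit else branches, so each arm of the nested if/else returns on its own. A stripped-down sketch of that control-flow shape only; the branch conditions and return values are placeholders, not the real writer construction:

    class BranchReturnSketch {

        // Before: unsupported cases fell through to one trailing "return null".
        // After: each branch returns explicitly, as sketched here.
        static String createWriter(boolean firstPath, boolean unpartitioned) {
            if (firstPath) {
                if (unpartitioned) {
                    return "writer A"; // placeholder for the real task writer
                } else {
                    return null; // unsupported combination
                }
            } else {
                if (unpartitioned) {
                    return "writer B"; // placeholder for the real task writer
                } else {
                    return null; // unsupported combination
                }
            }
        }
    }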

fluss-lake/fluss-lake-iceberg/src/main/java/com/alibaba/fluss/lake/iceberg/tiering/writer/DeltaTaskWriter.java

Lines changed: 8 additions & 8 deletions
@@ -20,7 +20,6 @@
 import com.alibaba.fluss.lake.iceberg.tiering.RecordWriter;
 import com.alibaba.fluss.metadata.TableBucket;
 import com.alibaba.fluss.record.LogRecord;
-import com.alibaba.fluss.shaded.guava32.com.google.common.collect.Lists;
 import com.alibaba.fluss.types.RowType;
 
 import org.apache.iceberg.FileFormat;
@@ -31,10 +30,10 @@
 import org.apache.iceberg.io.FileAppenderFactory;
 import org.apache.iceberg.io.OutputFileFactory;
 import org.apache.iceberg.io.TaskWriter;
-import org.apache.iceberg.util.ArrayUtil;
 
 import javax.annotation.Nullable;
 
+import java.util.ArrayList;
 import java.util.List;
 
 /** A {@link RecordWriter} to write to Iceberg's primary-key table. */
@@ -63,17 +62,19 @@ private static TaskWriter<Record> createTaskWriter(
             FileFormat format,
             OutputFileFactory outputFileFactory,
             long targetFileSize) {
-
+        int[] equalityFieldIds =
+                icebergTable.schema().identifierFieldIds().stream()
+                        .mapToInt(Integer::intValue)
+                        .toArray();
         FileAppenderFactory<Record> appenderFactory =
                 new GenericAppenderFactory(
                         icebergTable.schema(),
                         icebergTable.spec(),
-                        ArrayUtil.toIntArray(
-                                Lists.newArrayList(icebergTable.schema().identifierFieldIds())),
+                        equalityFieldIds,
                         icebergTable.schema(),
                         null);
 
-        List<String> columns = Lists.newArrayList();
+        List<String> columns = new ArrayList<>();
         for (Integer fieldId : icebergTable.schema().identifierFieldIds()) {
             columns.add(icebergTable.schema().findField(fieldId).name());
         }
@@ -99,9 +100,8 @@ public void write(LogRecord record) throws Exception {
                 deltaWriter.write(flussRecordAsIcebergRecord);
                 break;
             case UPDATE_BEFORE:
-                deltaWriter.delete(flussRecordAsIcebergRecord);
-                break;
             case DELETE:
+                // TODO we can project the record and only write the equality delete fields
                 deltaWriter.delete(flussRecordAsIcebergRecord);
                 break;
             default:
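DeltaTaskWriter now derives the equality field IDs with a plain stream instead of the shaded-Guava Lists.newArrayList plus ArrayUtil.toIntArray round trip. Schema#identifierFieldIds() returns a Set<Integer>, so the conversion is just mapToInt/toArray. A self-contained sketch of the same conversion with made-up field IDs:

    import java.util.Arrays;
    import java.util.LinkedHashSet;
    import java.util.Set;

    class EqualityFieldIdsSketch {

        public static void main(String[] args) {
            // Stand-in for icebergTable.schema().identifierFieldIds().
            Set<Integer> identifierFieldIds = new LinkedHashSet<>(Arrays.asList(1, 3));

            // Same expression as the patched createTaskWriter, minus the Iceberg table.
            int[] equalityFieldIds =
                    identifierFieldIds.stream().mapToInt(Integer::intValue).toArray();

            System.out.println(Arrays.toString(equalityFieldIds)); // prints [1, 3]
        }
    }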

fluss-lake/fluss-lake-iceberg/src/main/java/com/alibaba/fluss/lake/iceberg/tiering/writer/GenericTaskDeltaWriter.java

Lines changed: 4 additions & 9 deletions
@@ -56,11 +56,6 @@ public void delete(Record row) throws IOException {
         deltaWriter.delete(row);
     }
 
-    // The caller of this function is responsible for passing in a record with only the key fields
-    public void deleteKey(Record key) throws IOException {
-        deltaWriter.deleteKey(key);
-    }
-
     @Override
     public void close() throws IOException {
         deltaWriter.close();
@@ -73,13 +68,13 @@ private GenericEqualityDeltaWriter(
         }
 
         @Override
-        protected StructLike asStructLike(Record row) {
-            return row;
+        protected StructLike asStructLike(Record record) {
+            return record;
         }
 
         @Override
-        protected StructLike asStructLikeKey(Record data) {
-            return data;
+        protected StructLike asStructLikeKey(Record record) {
+            return record;
         }
     }
 }

fluss-lake/fluss-lake-iceberg/src/test/java/com/alibaba/fluss/lake/iceberg/IcebergTieringTest.java

Lines changed: 12 additions & 8 deletions
@@ -105,13 +105,17 @@ private static Stream<Arguments> tieringWriteArgs() {
     @ParameterizedTest
     @MethodSource("tieringWriteArgs")
     void testTieringWriteTable(boolean isPrimaryKeyTable) throws Exception {
-        TablePath tablePath = TablePath.of("iceberg", "test_table");
+        int bucketNum = 3;
+        TablePath tablePath =
+                TablePath.of(
+                        "iceberg",
+                        String.format(
+                                "test_tiering_table_%s",
+                                isPrimaryKeyTable ? "primary_key" : "log"));
         createTable(tablePath, isPrimaryKeyTable);
 
         Table icebergTable = icebergCatalog.loadTable(toIceberg(tablePath));
 
-        int bucketNum = 3;
-
         Map<Integer, List<LogRecord>> recordsByBucket = new HashMap<>();
 
         List<IcebergWriteResult> icebergWriteResults = new ArrayList<>();
@@ -126,14 +130,14 @@ void testTieringWriteTable(boolean isPrimaryKeyTable) throws Exception {
             Tuple2<List<LogRecord>, List<LogRecord>> writeAndExpectRecords =
                     isPrimaryKeyTable
                             ? genPrimaryKeyTableRecords(bucket)
-                            : genLogTableRecords(bucket, 5);
+                            : genLogTableRecords(bucket, 10);
 
             List<LogRecord> writtenRecords = writeAndExpectRecords.f0;
             List<LogRecord> expectRecords = writeAndExpectRecords.f1;
+            recordsByBucket.put(bucket, expectRecords);
             for (LogRecord record : writtenRecords) {
                 writer.write(record);
             }
-            recordsByBucket.put(bucket, expectRecords);
             IcebergWriteResult result = writer.complete();
             byte[] serialized = writeResultSerializer.serialize(result);
             icebergWriteResults.add(
@@ -167,7 +171,7 @@ void testTieringWriteTable(boolean isPrimaryKeyTable) throws Exception {
             if (isPrimaryKeyTable) {
                 verifyPrimaryKeyTableRecord(actualRecords, expectRecords, bucket);
             } else {
-                verifyLogTableRecords(actualRecords, bucket, expectRecords);
+                verifyLogTableRecords(actualRecords, expectRecords, bucket);
             }
         }
     }
@@ -329,8 +333,8 @@ private CloseableIterator<Record> getIcebergRows(Table table, int bucket) {
 
     private void verifyLogTableRecords(
             CloseableIterator<Record> actualRecords,
-            int expectBucket,
-            List<LogRecord> expectRecords) {
+            List<LogRecord> expectRecords,
+            int expectBucket) {
         for (LogRecord expectRecord : expectRecords) {
             Record actualRecord = actualRecords.next();
             // check business columns:
