[coordinator] CoordinatorEventProcessor shouldn't process PartitionCreated event for existing partition (#419)

luoyuxia · web-flow · commit 465730f17731 · 2025-02-27T16:40:02.000+08:00
diff --git a/fluss-server/src/main/java/com/alibaba/fluss/server/coordinator/CoordinatorEventProcessor.java b/fluss-server/src/main/java/com/alibaba/fluss/server/coordinator/CoordinatorEventProcessor.java
@@ -500,6 +500,11 @@ private void updateMetrics() {
     }
 
     private void processCreateTable(CreateTableEvent createTableEvent) {
+        long tableId = createTableEvent.getTableInfo().getTableId();
+        // skip the table if it already exists
+        if (coordinatorContext.containsTableId(tableId)) {
+            return;
+        }
         TableInfo tableInfo = createTableEvent.getTableInfo();
         coordinatorContext.putTableInfo(tableInfo);
         tableManager.onCreateNewTable(
@@ -512,6 +517,11 @@ private void processCreateTable(CreateTableEvent createTableEvent) {
     }
 
     private void processCreatePartition(CreatePartitionEvent createPartitionEvent) {
+        long partitionId = createPartitionEvent.getPartitionId();
+        // skip the partition if it already exists
+        if (coordinatorContext.containsPartitionId(partitionId)) {
+            return;
+        }
         tableManager.onCreateNewPartition(
                 createPartitionEvent.getTablePath(),
                 createPartitionEvent.getTableId(),
diff --git a/fluss-server/src/test/java/com/alibaba/fluss/server/coordinator/CoordinatorEventProcessorTest.java b/fluss-server/src/test/java/com/alibaba/fluss/server/coordinator/CoordinatorEventProcessorTest.java
@@ -30,10 +30,7 @@
 import com.alibaba.fluss.metadata.TablePath;
 import com.alibaba.fluss.rpc.messages.CommitKvSnapshotResponse;
 import com.alibaba.fluss.server.coordinator.event.CommitKvSnapshotEvent;
-import com.alibaba.fluss.server.coordinator.event.CoordinatorEvent;
 import com.alibaba.fluss.server.coordinator.event.CoordinatorEventManager;
-import com.alibaba.fluss.server.coordinator.event.CreatePartitionEvent;
-import com.alibaba.fluss.server.coordinator.event.DropPartitionEvent;
 import com.alibaba.fluss.server.coordinator.statemachine.BucketState;
 import com.alibaba.fluss.server.coordinator.statemachine.ReplicaState;
 import com.alibaba.fluss.server.entity.CommitKvSnapshotData;
@@ -56,6 +53,7 @@
 import com.alibaba.fluss.server.zk.data.ZkData.TableIdsZNode;
 import com.alibaba.fluss.testutils.common.AllCallbackWrapper;
 import com.alibaba.fluss.types.DataTypes;
+import com.alibaba.fluss.utils.types.Tuple2;
 
 import org.junit.jupiter.api.AfterEach;
 import org.junit.jupiter.api.BeforeAll;
@@ -78,6 +76,9 @@
 import java.util.concurrent.CompletableFuture;
 import java.util.stream.Collectors;
 
+import static com.alibaba.fluss.server.coordinator.CoordinatorTestUtils.checkLeaderAndIsr;
+import static com.alibaba.fluss.server.coordinator.CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess;
+import static com.alibaba.fluss.server.coordinator.CoordinatorTestUtils.makeSendLeaderAndStopRequestFailContext;
 import static com.alibaba.fluss.server.coordinator.CoordinatorTestUtils.verifyBucketForPartitionInState;
 import static com.alibaba.fluss.server.coordinator.CoordinatorTestUtils.verifyBucketForTableInState;
 import static com.alibaba.fluss.server.coordinator.CoordinatorTestUtils.verifyReplicaForPartitionInState;
@@ -173,7 +174,7 @@ void afterEach() {
     void testCreateAndDropTable() throws Exception {
         CoordinatorContext coordinatorContext = eventProcessor.getCoordinatorContext();
         // make sure all request to gateway should be successful
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess(
+        makeSendLeaderAndStopRequestAlwaysSuccess(
                 eventProcessor.getCoordinatorContext(), testCoordinatorChannelManager);
         // create a table,
         TablePath t1 = TablePath.of(defaultDatabase, "create_drop_t1");
@@ -226,7 +227,7 @@ void testCreateAndDropTable() throws Exception {
                         autoPartitionManager,
                         TestingMetricGroups.COORDINATOR_METRICS,
                         new Configuration());
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess(
+        makeSendLeaderAndStopRequestAlwaysSuccess(
                 testCoordinatorChannelManager,
                 Arrays.stream(zookeeperClient.getSortedTabletServerList())
                         .boxed()
@@ -247,7 +248,7 @@ void testDropTableWithRetry() throws Exception {
         // make request to some server should fail, but delete will still be successful
         // finally with retry logic
         int failedServer = 0;
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestFailContext(
+        makeSendLeaderAndStopRequestFailContext(
                 testCoordinatorChannelManager,
                 Arrays.stream(zookeeperClient.getSortedTabletServerList())
                         .boxed()
@@ -283,7 +284,7 @@ void testDropTableWithRetry() throws Exception {
     void testServerBecomeOnlineAndOfflineLine() throws Exception {
         CoordinatorContext coordinatorContext = eventProcessor.getCoordinatorContext();
         // make sure all request to gateway should be successful
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess(
+        makeSendLeaderAndStopRequestAlwaysSuccess(
                 eventProcessor.getCoordinatorContext(), testCoordinatorChannelManager);
         // assume a new server become online;
         // check the server has been added into coordinator context
@@ -303,7 +304,7 @@ void testServerBecomeOnlineAndOfflineLine() throws Exception {
                         assertThat(coordinatorContext.getLiveTabletServers())
                                 .containsKey(newlyServerId));
 
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess(
+        makeSendLeaderAndStopRequestAlwaysSuccess(
                 eventProcessor.getCoordinatorContext(), testCoordinatorChannelManager);
         verifyTabletServer(coordinatorContext, newlyServerId, tabletServerRegistration);
 
@@ -373,7 +374,7 @@ void testServerBecomeOnlineAndOfflineLine() throws Exception {
         // should change the leader for bucket2 of t1 should change since the leader fail
         assertThat(coordinatorContext.getBucketState(t1Bucket1)).isEqualTo(OnlineBucket);
         // leader should change to replica2, leader epoch should be 1
-        CoordinatorTestUtils.checkLeaderAndIsr(zookeeperClient, t1Bucket1, 1, 2);
+        checkLeaderAndIsr(zookeeperClient, t1Bucket1, 1, 2);
 
         // the bucket with no any other available servers should be still offline,
         // t2 bucket0 should still be offline
@@ -420,7 +421,7 @@ void testServerBecomeOnlineAndOfflineLine() throws Exception {
 
         // in this test case, so make requests to gateway should always be
         // successful for when start up, it will send request to tablet servers
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess(
+        makeSendLeaderAndStopRequestAlwaysSuccess(
                 testCoordinatorChannelManager,
                 Arrays.stream(zookeeperClient.getSortedTabletServerList())
                         .boxed()
@@ -453,7 +454,7 @@ void testRestartTriggerReplicaToOffline() throws Exception {
         long table1Id = metadataManager.createTable(tablePath, TEST_TABLE, tableAssignment, false);
 
         // let's restart
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess(
+        makeSendLeaderAndStopRequestAlwaysSuccess(
                 eventProcessor.getCoordinatorContext(), testCoordinatorChannelManager);
         eventProcessor.shutdown();
         eventProcessor =
@@ -466,7 +467,7 @@ void testRestartTriggerReplicaToOffline() throws Exception {
                         new Configuration());
         CoordinatorContext coordinatorContext = eventProcessor.getCoordinatorContext();
         int failedServer = 0;
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestFailContext(
+        makeSendLeaderAndStopRequestFailContext(
                 testCoordinatorChannelManager,
                 Arrays.stream(zookeeperClient.getSortedTabletServerList())
                         .boxed()
@@ -488,7 +489,7 @@ void testRestartTriggerReplicaToOffline() throws Exception {
                 });
 
         // check the changed leader and isr info
-        CoordinatorTestUtils.checkLeaderAndIsr(zookeeperClient, t1Bucket0, 1, 1);
+        checkLeaderAndIsr(zookeeperClient, t1Bucket0, 1, 1);
         retry(
                 Duration.ofMinutes(1),
                 () -> {
@@ -579,44 +580,31 @@ void testAddBucketCompletedSnapshot(@TempDir Path tempDir) throws Exception {
 
     @Test
     void testCreateAndDropPartition() throws Exception {
+        TablePath tablePath = TablePath.of(defaultDatabase, "test_create_drop_partition");
         CoordinatorContext coordinatorContext = eventProcessor.getCoordinatorContext();
         // make sure all request to gateway should be successful
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess(
-                eventProcessor.getCoordinatorContext(), testCoordinatorChannelManager);
+        makeSendLeaderAndStopRequestAlwaysSuccess(
+                coordinatorContext, testCoordinatorChannelManager);
         // create a partitioned table
-        TablePath tablePath = TablePath.of(defaultDatabase, "partition_table");
         TableDescriptor tablePartitionTableDescriptor = getPartitionedTable();
         long tableId =
                 metadataManager.createTable(tablePath, tablePartitionTableDescriptor, null, false);
 
-        retry(
-                Duration.ofMinutes(1),
-                // retry util the table has been put into context
-                () -> assertThat(coordinatorContext.getTablePathById(tableId)).isNotNull());
-
-        // create partition
-        long partition1Id = zookeeperClient.getPartitionIdAndIncrement();
-        long partition2Id = zookeeperClient.getPartitionIdAndIncrement();
         int nBuckets = 3;
         int replicationFactor = 3;
-        String partition1Name = "2024";
-        String partition2Name = "2025";
         Map<Integer, BucketAssignment> assignments =
                 TableAssignmentUtils.generateAssignment(
                                 nBuckets, replicationFactor, new int[] {0, 1, 2})
                         .getBucketAssignments();
         PartitionAssignment partitionAssignment = new PartitionAssignment(tableId, assignments);
-        zookeeperClient.registerPartitionAssignment(partition1Id, partitionAssignment);
-        zookeeperClient.registerPartitionAssignment(partition2Id, partitionAssignment);
+        Tuple2<PartitionIdName, PartitionIdName> partitionIdAndNameTuple2 =
+                preparePartitionAssignment(
+                        tablePath, tableId, coordinatorContext, partitionAssignment);
+
+        long partition1Id = partitionIdAndNameTuple2.f0.partitionId;
+        String partition1Name = partitionIdAndNameTuple2.f0.partitionName;
+        long partition2Id = partitionIdAndNameTuple2.f1.partitionId;
 
-        CoordinatorEvent createPartitionEvent =
-                new CreatePartitionEvent(
-                        tablePath, tableId, partition1Id, partition1Name, partitionAssignment);
-        eventProcessor.process(createPartitionEvent);
-        createPartitionEvent =
-                new CreatePartitionEvent(
-                        tablePath, tableId, partition2Id, partition2Name, partitionAssignment);
-        eventProcessor.process(createPartitionEvent);
         verifyPartitionCreated(
                 coordinatorContext,
                 new TablePartition(tableId, partition1Id),
@@ -644,9 +632,7 @@ void testCreateAndDropPartition() throws Exception {
         assertThat(completedSnapshotStoreManager.getBucketCompletedSnapshotStores()).isNotEmpty();
 
         // drop the partition
-        DropPartitionEvent dropPartitionEvent = new DropPartitionEvent(tableId, partition1Id);
-        eventProcessor.process(dropPartitionEvent);
-
+        zookeeperClient.deletePartition(tablePath, partition1Name);
         verifyPartitionDropped(coordinatorContext, tableId, partition1Id);
 
         // verify CompleteSnapshotStore has been removed when the table partition1 is dropped
@@ -666,16 +652,113 @@ void testCreateAndDropPartition() throws Exception {
                         autoPartitionManager,
                         TestingMetricGroups.COORDINATOR_METRICS,
                         new Configuration());
-        CoordinatorTestUtils.makeSendLeaderAndStopRequestAlwaysSuccess(
+        makeSendLeaderAndStopRequestAlwaysSuccess(
                 testCoordinatorChannelManager,
                 Arrays.stream(zookeeperClient.getSortedTabletServerList())
                         .boxed()
                         .collect(Collectors.toSet()));
         eventProcessor.startup();
-        verifyPartitionDropped(coordinatorContext, tableId, partition2Id);
+        verifyPartitionDropped(eventProcessor.getCoordinatorContext(), tableId, partition2Id);
     }
 
-    // todo: add test resume drop partition
+    @Test
+    void testRestartResumeDropPartition() throws Exception {
+        TablePath tablePath = TablePath.of(defaultDatabase, "test_resume_drop_partition");
+        CoordinatorContext coordinatorContext = eventProcessor.getCoordinatorContext();
+        // make sure all request to gateway should be successful
+        makeSendLeaderAndStopRequestAlwaysSuccess(
+                coordinatorContext, testCoordinatorChannelManager);
+        // create a partitioned table
+        TableDescriptor tablePartitionTableDescriptor = getPartitionedTable();
+        long tableId =
+                metadataManager.createTable(tablePath, tablePartitionTableDescriptor, null, false);
+
+        int nBuckets = 3;
+        int replicationFactor = 3;
+        Map<Integer, BucketAssignment> assignments =
+                TableAssignmentUtils.generateAssignment(
+                                nBuckets, replicationFactor, new int[] {0, 1, 2})
+                        .getBucketAssignments();
+        PartitionAssignment partitionAssignment = new PartitionAssignment(tableId, assignments);
+        Tuple2<PartitionIdName, PartitionIdName> partitionIdAndNameTuple2 =
+                preparePartitionAssignment(
+                        tablePath, tableId, coordinatorContext, partitionAssignment);
+
+        long partition1Id = partitionIdAndNameTuple2.f0.partitionId;
+        String partition2Name = partitionIdAndNameTuple2.f1.partitionName;
+        long partition2Id = partitionIdAndNameTuple2.f1.partitionId;
+
+        verifyPartitionCreated(
+                coordinatorContext,
+                new TablePartition(tableId, partition1Id),
+                partitionAssignment,
+                nBuckets,
+                replicationFactor);
+        verifyPartitionCreated(
+                coordinatorContext,
+                new TablePartition(tableId, partition2Id),
+                partitionAssignment,
+                nBuckets,
+                replicationFactor);
+
+        // now, drop partition2 and restart the coordinator event processor,
+        // the partition2 should be dropped
+        eventProcessor.shutdown();
+        zookeeperClient.deletePartition(tablePath, partition2Name);
+
+        // start the coordinator
+        eventProcessor =
+                new CoordinatorEventProcessor(
+                        zookeeperClient,
+                        serverMetadataCache,
+                        testCoordinatorChannelManager,
+                        autoPartitionManager,
+                        TestingMetricGroups.COORDINATOR_METRICS,
+                        new Configuration());
+        makeSendLeaderAndStopRequestAlwaysSuccess(
+                testCoordinatorChannelManager,
+                Arrays.stream(zookeeperClient.getSortedTabletServerList())
+                        .boxed()
+                        .collect(Collectors.toSet()));
+        eventProcessor.startup();
+
+        CoordinatorContext newContext = eventProcessor.getCoordinatorContext();
+        // verify partition2 is dropped
+        verifyPartitionDropped(newContext, tableId, partition2Id);
+        // verify the status of partition1
+        verifyPartitionCreated(
+                newContext,
+                new TablePartition(tableId, partition1Id),
+                partitionAssignment,
+                nBuckets,
+                replicationFactor);
+    }
+
+    private Tuple2<PartitionIdName, PartitionIdName> preparePartitionAssignment(
+            TablePath tablePath,
+            long tableId,
+            CoordinatorContext coordinatorContext,
+            PartitionAssignment partitionAssignment)
+            throws Exception {
+        retry(
+                Duration.ofMinutes(1),
+                // retry util the table has been put into context
+                () -> assertThat(coordinatorContext.getTablePathById(tableId)).isNotNull());
+
+        // create partition
+        long partition1Id = zookeeperClient.getPartitionIdAndIncrement();
+        long partition2Id = zookeeperClient.getPartitionIdAndIncrement();
+        String partition1Name = "2024";
+        String partition2Name = "2025";
+        zookeeperClient.registerPartitionAssignment(partition1Id, partitionAssignment);
+        zookeeperClient.registerPartition(tablePath, tableId, partition1Name, partition1Id);
+        zookeeperClient.registerPartitionAssignment(partition2Id, partitionAssignment);
+        zookeeperClient.registerPartition(tablePath, tableId, partition2Name, partition2Id);
+
+        return Tuple2.of(
+                new PartitionIdName(partition1Id, partition1Name),
+                new PartitionIdName(partition2Id, partition2Name));
+    }
 
     private void verifyTableCreated(
             CoordinatorContext coordinatorContext,
@@ -713,7 +796,7 @@ private void verifyTableCreated(
                                 nBuckets * replicationFactor,
                                 ReplicaState.OnlineReplica));
         for (TableBucket tableBucket : coordinatorContext.getAllBucketsForTable(tableId)) {
-            CoordinatorTestUtils.checkLeaderAndIsr(
+            checkLeaderAndIsr(
                     zookeeperClient,
                     tableBucket,
                     0,
@@ -766,7 +849,7 @@ private void verifyPartitionCreated(
         for (TableBucket tableBucket :
                 coordinatorContext.getAllBucketsForPartition(
                         tablePartition.getTableId(), tablePartition.getPartitionId())) {
-            CoordinatorTestUtils.checkLeaderAndIsr(
+            checkLeaderAndIsr(
                     zookeeperClient,
                     tableBucket,
                     0,
@@ -891,7 +974,19 @@ private TableDescriptor getPartitionedTable() {
                 .partitionedBy("b")
                 .property(ConfigOptions.TABLE_AUTO_PARTITION_ENABLED.key(), "true")
                 .property(ConfigOptions.TABLE_AUTO_PARTITION_TIME_UNIT.key(), "DAY")
+                // set to 0 to disable pre-create partition
+                .property(ConfigOptions.TABLE_AUTO_PARTITION_NUM_PRECREATE, 0)
                 .build()
                 .withReplicationFactor(REPLICATION_FACTOR);
     }
+
+    private static class PartitionIdName {
+        private final long partitionId;
+        private final String partitionName;
+
+        private PartitionIdName(long partitionId, String partitionName) {
+            this.partitionId = partitionId;
+            this.partitionName = partitionName;
+        }
+    }
 }