Commit 1c38a02

[Client] Fix LogFetcher not updating bucket metadata when receiving NotLeaderOrFollowerException at the bucket level
1 parent e69e4f4 commit 1c38a02

File tree

5 files changed: +369, -204 lines

fluss-client/src/main/java/org/apache/fluss/client/table/scanner/log/LogFetcher.java

Lines changed: 37 additions & 2 deletions
@@ -26,6 +26,7 @@
 import org.apache.fluss.cluster.BucketLocation;
 import org.apache.fluss.config.ConfigOptions;
 import org.apache.fluss.config.Configuration;
+import org.apache.fluss.exception.ApiException;
 import org.apache.fluss.exception.InvalidMetadataException;
 import org.apache.fluss.exception.LeaderNotAvailableException;
 import org.apache.fluss.fs.FsPath;
@@ -47,6 +48,7 @@
 import org.apache.fluss.rpc.messages.PbFetchLogReqForTable;
 import org.apache.fluss.rpc.messages.PbFetchLogRespForBucket;
 import org.apache.fluss.rpc.messages.PbFetchLogRespForTable;
+import org.apache.fluss.rpc.protocol.ApiError;
 import org.apache.fluss.rpc.protocol.Errors;
 import org.apache.fluss.utils.IOUtils;
 import org.apache.fluss.utils.Projection;
@@ -220,7 +222,8 @@ private void checkAndUpdateMetadata(List<TableBucket> tableBuckets) {
         }
     }

-    private void sendFetchRequest(int destination, FetchLogRequest fetchLogRequest) {
+    @VisibleForTesting
+    void sendFetchRequest(int destination, FetchLogRequest fetchLogRequest) {
         TableOrPartitions tableOrPartitionsInFetchRequest =
                 getTableOrPartitionsInFetchRequest(fetchLogRequest);
         // TODO cache the tablet server gateway.
@@ -341,6 +344,14 @@ private synchronized void handleFetchLogResponse(
                             respForBucket.getBucketId());
             FetchLogResultForBucket fetchResultForBucket =
                     getFetchLogResultForBucket(tb, tablePath, respForBucket);
+
+            // if the error code is not NONE, the fetch log request failed for this
+            // bucket; clear the table bucket metadata on InvalidMetadataException.
+            if (fetchResultForBucket.getErrorCode() != Errors.NONE.code()) {
+                ApiError error = ApiError.fromErrorMessage(respForBucket);
+                handleFetchLogExceptionForBucket(tb, destination, error);
+            }
+
             Long fetchOffset = logScannerStatus.getBucketOffset(tb);
             // if the offset is null, it means the bucket has been unsubscribed,
             // we just set a Long.MAX_VALUE as the next fetch offset
@@ -383,6 +394,29 @@ private synchronized void handleFetchLogResponse(
         }
     }

+    private void handleFetchLogExceptionForBucket(TableBucket tb, int destination, ApiError error) {
+        ApiException exception = error.error().exception();
+        LOG.error("Failed to fetch log from node {} for bucket {}", destination, tb, exception);
+        if (exception instanceof InvalidMetadataException) {
+            LOG.warn(
+                    "Invalid metadata error in fetch log request. "
+                            + "Going to request metadata update.",
+                    exception);
+            long tableId = tb.getTableId();
+            TableOrPartitions tableOrPartitions;
+            if (tb.getPartitionId() == null) {
+                tableOrPartitions = new TableOrPartitions(Collections.singleton(tableId), null);
+            } else {
+                tableOrPartitions =
+                        new TableOrPartitions(
+                                null,
+                                Collections.singleton(
+                                        new TablePartition(tableId, tb.getPartitionId())));
+            }
+            invalidTableOrPartitions(tableOrPartitions);
+        }
+    }
+
     private void pendRemoteFetches(
             RemoteLogFetchInfo remoteLogFetchInfo, long firstFetchOffset, long highWatermark) {
         checkNotNull(remoteLogFetchInfo);
@@ -413,7 +447,8 @@ private void pendRemoteFetches(
         }
     }

-    private Map<Integer, FetchLogRequest> prepareFetchLogRequests() {
+    @VisibleForTesting
+    Map<Integer, FetchLogRequest> prepareFetchLogRequests() {
         Map<Integer, List<PbFetchLogReqForBucket>> fetchLogReqForBuckets = new HashMap<>();
         int readyForFetchCount = 0;
         Long tableId = null;
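
Note on the two hunks above: a fetch response can now succeed at the request level while individual buckets carry error codes, and each PbFetchLogRespForBucket is inspected on its own. Flattened into one block, the new per-bucket path looks roughly like this; all names come from the diff, and the one assumption not visible here is that NotLeaderOrFollowerException extends InvalidMetadataException, as in the Kafka-style error hierarchy this client follows:

    // Sketch: per-bucket error handling inside handleFetchLogResponse.
    if (fetchResultForBucket.getErrorCode() != Errors.NONE.code()) {
        ApiException exception =
                ApiError.fromErrorMessage(respForBucket).error().exception();
        // A moved leader lands here, assuming NotLeaderOrFollowerException
        // subtypes InvalidMetadataException.
        if (exception instanceof InvalidMetadataException) {
            long tableId = tb.getTableId();
            // Non-partitioned buckets invalidate the whole table; partitioned
            // buckets invalidate only their own (tableId, partitionId) pair.
            TableOrPartitions stale =
                    tb.getPartitionId() == null
                            ? new TableOrPartitions(Collections.singleton(tableId), null)
                            : new TableOrPartitions(
                                    null,
                                    Collections.singleton(
                                            new TablePartition(
                                                    tableId, tb.getPartitionId())));
            // Drop the cached locations so the next prepareFetchLogRequests()
            // resolves a fresh leader.
            invalidTableOrPartitions(stale);
        }
    }

Before this change, only request-level failures reached the invalidation path, so a bucket-level NotLeaderOrFollowerException left the client fetching from a stale leader.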

fluss-client/src/test/java/org/apache/fluss/client/metadata/TestingMetadataUpdater.java

Lines changed: 4 additions & 0 deletions
@@ -78,6 +78,10 @@ public void updateCluster(Cluster cluster) {
         this.cluster = cluster;
     }

+    public void setResponseLogicId(int serverId, int responseLogicId) {
+        tabletServerGatewayMap.get(serverId).setResponseLogicId(responseLogicId);
+    }
+
     @Override
     public void checkAndUpdateTableMetadata(Set<TablePath> tablePaths) {
         Set<TablePath> needUpdateTablePaths =
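
The new hook simply forwards to the per-server testing gateway; the semantics of responseLogicId are defined inside that gateway and are not part of this excerpt (two of the five changed files are not shown). A hypothetical usage sketch, with both argument values illustrative:

    // Hypothetical: switch server 1's testing gateway into a response mode that
    // answers fetches with a bucket-level error, then verify the fetcher reacts
    // by invalidating metadata rather than fetching from the stale leader.
    testingMetadataUpdater.setResponseLogicId(1, 1);
    logFetcher.sendFetches();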
fluss-client/src/test/java/org/apache/fluss/client/table/scanner/log/LogFetcherITCase.java (new file)

Lines changed: 248 additions & 0 deletions

@@ -0,0 +1,248 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.fluss.client.table.scanner.log;
+
+import org.apache.fluss.client.admin.ClientToServerITCaseBase;
+import org.apache.fluss.client.metadata.MetadataUpdater;
+import org.apache.fluss.client.metrics.TestingScannerMetricGroup;
+import org.apache.fluss.client.table.scanner.RemoteFileDownloader;
+import org.apache.fluss.client.table.scanner.ScanRecord;
+import org.apache.fluss.cluster.Cluster;
+import org.apache.fluss.cluster.ServerNode;
+import org.apache.fluss.metadata.TableBucket;
+import org.apache.fluss.record.MemoryLogRecords;
+import org.apache.fluss.rpc.RpcClient;
+import org.apache.fluss.rpc.gateway.TabletServerGateway;
+import org.apache.fluss.rpc.messages.PbProduceLogRespForBucket;
+import org.apache.fluss.rpc.messages.ProduceLogResponse;
+
+import org.junit.jupiter.api.BeforeEach;
+import org.junit.jupiter.api.Test;
+
+import java.time.Duration;
+import java.util.Collections;
+import java.util.HashMap;
+import java.util.List;
+import java.util.Map;
+import java.util.concurrent.ExecutorService;
+import java.util.concurrent.Executors;
+import java.util.concurrent.Future;
+import java.util.concurrent.TimeUnit;
+
+import static org.apache.fluss.record.TestData.DATA1;
+import static org.apache.fluss.record.TestData.DATA1_TABLE_DESCRIPTOR;
+import static org.apache.fluss.record.TestData.DATA1_TABLE_INFO;
+import static org.apache.fluss.record.TestData.DATA1_TABLE_PATH;
+import static org.apache.fluss.server.testutils.RpcMessageTestUtils.newProduceLogRequest;
+import static org.apache.fluss.testutils.DataTestUtils.genMemoryLogRecordsByObject;
+import static org.apache.fluss.testutils.common.CommonTestUtils.retry;
+import static org.assertj.core.api.Assertions.assertThat;
+
+/** IT test for {@link LogFetcher}. */
+public class LogFetcherITCase extends ClientToServerITCaseBase {
+    private LogFetcher logFetcher;
+    private long tableId;
+    private final int bucketId0 = 0;
+    private final int bucketId1 = 1;
+    private LogScannerStatus logScannerStatus;
+
+    @BeforeEach
+    protected void setup() throws Exception {
+        super.setup();
+
+        // Create the table for DATA1_TABLE_PATH up front.
+        tableId = createTable(DATA1_TABLE_PATH, DATA1_TABLE_DESCRIPTOR, false);
+        FLUSS_CLUSTER_EXTENSION.waitUntilTableReady(tableId);
+
+        RpcClient rpcClient = FLUSS_CLUSTER_EXTENSION.getRpcClient();
+        MetadataUpdater metadataUpdater = new MetadataUpdater(clientConf, rpcClient);
+        metadataUpdater.checkAndUpdateTableMetadata(Collections.singleton(DATA1_TABLE_PATH));
+
+        Map<TableBucket, Long> scanBuckets = new HashMap<>();
+        // add bucket 0 and bucket 1 to the log scanner status.
+        scanBuckets.put(new TableBucket(tableId, bucketId0), 0L);
+        scanBuckets.put(new TableBucket(tableId, bucketId1), 0L);
+        logScannerStatus = new LogScannerStatus();
+        logScannerStatus.assignScanBuckets(scanBuckets);
+        logFetcher =
+                new LogFetcher(
+                        DATA1_TABLE_INFO,
+                        null,
+                        logScannerStatus,
+                        clientConf,
+                        metadataUpdater,
+                        TestingScannerMetricGroup.newInstance(),
+                        new RemoteFileDownloader(1));
+    }
+
+    @Test
+    void testFetch() throws Exception {
+        // add one batch of records to tb0.
+        TableBucket tb0 = new TableBucket(tableId, bucketId0);
+        addRecordsToBucket(tb0, genMemoryLogRecordsByObject(DATA1), 0L);
+
+        // add one batch of records to tb1.
+        TableBucket tb1 = new TableBucket(tableId, bucketId1);
+        addRecordsToBucket(tb1, genMemoryLogRecordsByObject(DATA1), 0L);
+
+        assertThat(logFetcher.hasAvailableFetches()).isFalse();
+        // collectFetch will be empty while there is no available fetch.
+        assertThat(logFetcher.collectFetch()).isEmpty();
+
+        // send fetches to fetch data.
+        logFetcher.sendFetches();
+        // The fetcher fetches data asynchronously, so we need to wait for the
+        // result to be written to the logFetchBuffer.
+        retry(
+                Duration.ofMinutes(1),
+                () -> {
+                    assertThat(logFetcher.hasAvailableFetches()).isTrue();
+                    assertThat(logFetcher.getCompletedFetchesSize()).isEqualTo(2);
+                });
+
+        Map<TableBucket, List<ScanRecord>> records = logFetcher.collectFetch();
+        assertThat(records.size()).isEqualTo(2);
+        assertThat(records.get(tb0).size()).isEqualTo(10);
+        assertThat(records.get(tb1).size()).isEqualTo(10);
+
+        // after collectFetch, the fetcher is empty.
+        assertThat(logFetcher.hasAvailableFetches()).isFalse();
+        assertThat(logFetcher.getCompletedFetchesSize()).isEqualTo(0);
+    }
+
+    @Test
+    void testFetchWhenDestinationIsNullInMetadata() throws Exception {
+        TableBucket tb0 = new TableBucket(tableId, bucketId0);
+        addRecordsToBucket(tb0, genMemoryLogRecordsByObject(DATA1), 0L);
+
+        RpcClient rpcClient = FLUSS_CLUSTER_EXTENSION.getRpcClient();
+        MetadataUpdater metadataUpdater = new MetadataUpdater(clientConf, rpcClient);
+        metadataUpdater.checkAndUpdateTableMetadata(Collections.singleton(DATA1_TABLE_PATH));
+
+        int leaderNode = metadataUpdater.leaderFor(tb0);
+
+        // now, remove the leader node so that the fetch destination
+        // server node is null.
+        Cluster oldCluster = metadataUpdater.getCluster();
+        Map<Integer, ServerNode> aliveTabletServersById =
+                new HashMap<>(oldCluster.getAliveTabletServers());
+        aliveTabletServersById.remove(leaderNode);
+        Cluster newCluster =
+                new Cluster(
+                        aliveTabletServersById,
+                        oldCluster.getCoordinatorServer(),
+                        oldCluster.getBucketLocationsByPath(),
+                        oldCluster.getTableIdByPath(),
+                        oldCluster.getPartitionIdByPath(),
+                        oldCluster.getTableInfoByPath());
+        metadataUpdater = new MetadataUpdater(rpcClient, newCluster);
+
+        LogScannerStatus logScannerStatus = new LogScannerStatus();
+        logScannerStatus.assignScanBuckets(Collections.singletonMap(tb0, 0L));
+
+        LogFetcher logFetcher =
+                new LogFetcher(
+                        DATA1_TABLE_INFO,
+                        null,
+                        logScannerStatus,
+                        clientConf,
+                        metadataUpdater,
+                        TestingScannerMetricGroup.newInstance(),
+                        new RemoteFileDownloader(1));
+
+        // send fetches to fetch data; there should be no available fetch yet.
+        logFetcher.sendFetches();
+        assertThat(logFetcher.hasAvailableFetches()).isFalse();
+
+        // then fetch again; this time there should be an available fetch:
+        // the first send fetch only triggers the metadata update,
+        logFetcher.sendFetches();
+        // the second send fetch does the real data fetch.
+        logFetcher.sendFetches();
+        retry(
+                Duration.ofMinutes(1),
+                () -> {
+                    assertThat(logFetcher.hasAvailableFetches()).isTrue();
+                    assertThat(logFetcher.getCompletedFetchesSize()).isEqualTo(1);
+                });
+        Map<TableBucket, List<ScanRecord>> records = logFetcher.collectFetch();
+        assertThat(records.size()).isEqualTo(1);
+        assertThat(records.get(tb0).size()).isEqualTo(10);
+    }
+
+    @Test
+    void testFetchWithInvalidTableOrPartitions() throws Exception {
+        MetadataUpdater metadataUpdater1 =
+                new MetadataUpdater(clientConf, FLUSS_CLUSTER_EXTENSION.getRpcClient());
+        logFetcher =
+                new LogFetcher(
+                        DATA1_TABLE_INFO,
+                        null,
+                        logScannerStatus,
+                        clientConf,
+                        metadataUpdater1,
+                        TestingScannerMetricGroup.newInstance(),
+                        new RemoteFileDownloader(1));
+
+        ExecutorService executor = Executors.newSingleThreadExecutor();
+        Future<?> future =
+                executor.submit(
+                        () -> {
+                            // If this test blocks, please check whether it is blocked
+                            // for the same reason as https://github.com/apache/fluss/pull/1666
+                            for (int i = 0; i < 1000; i++) {
+                                logFetcher.sendFetches();
+                                logFetcher.invalidTableOrPartitions(
+                                        new LogFetcher.TableOrPartitions(
+                                                Collections.singleton(tableId), null));
+                            }
+                        });
+
+        future.get(30, TimeUnit.SECONDS);
+        assertThat(future.isDone()).isTrue();
+        executor.shutdownNow();
+    }
+
+    private void addRecordsToBucket(
+            TableBucket tableBucket, MemoryLogRecords logRecords, long expectedBaseOffset)
+            throws Exception {
+        int leader = FLUSS_CLUSTER_EXTENSION.waitAndGetLeader(tableBucket);
+        TabletServerGateway leaderGateWay =
+                FLUSS_CLUSTER_EXTENSION.newTabletServerClientForNode(leader);
+        assertProduceLogResponse(
+                leaderGateWay
+                        .produceLog(
+                                newProduceLogRequest(
+                                        tableBucket.getTableId(),
+                                        tableBucket.getBucket(),
+                                        -1, // need ack, so we can make sure every batch is acked.
+                                        logRecords))
+                        .get(),
+                tableBucket.getBucket(),
+                expectedBaseOffset);
+    }
+
+    private static void assertProduceLogResponse(
+            ProduceLogResponse produceLogResponse, int bucketId, Long baseOffset) {
+        assertThat(produceLogResponse.getBucketsRespsCount()).isEqualTo(1);
+        PbProduceLogRespForBucket produceLogRespForBucket =
+                produceLogResponse.getBucketsRespsList().get(0);
+        assertThat(produceLogRespForBucket.getBucketId()).isEqualTo(bucketId);
+        assertThat(produceLogRespForBucket.getBaseOffset()).isEqualTo(baseOffset);
+    }
+}
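
testFetchWhenDestinationIsNullInMetadata pins down the retry contract of the fix: when the cached cluster no longer contains the bucket's leader, a sendFetches() round is spent refreshing metadata before any data flows. The diff does not show the corresponding branch in prepareFetchLogRequests(), so the following is an inference from the test's behavior, not the actual body; only the surrounding names come from this page:

    // Assumed shape of the destination-null handling in prepareFetchLogRequests():
    // with no usable leader, request a metadata refresh and skip the bucket this
    // round; the next sendFetches() sees the refreshed cluster and fetches data.
    Integer leader = metadataUpdater.leaderFor(tb); // hypothetical nullable lookup
    if (leader == null) {
        metadataUpdater.checkAndUpdateTableMetadata(Collections.singleton(tablePath));
    } else {
        fetchLogReqForBuckets
                .computeIfAbsent(leader, id -> new ArrayList<>())
                .add(fetchLogReqForBucket); // per-bucket request built elsewhere
    }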
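
testFetchWithInvalidTableOrPartitions, by contrast, is a regression guard rather than a data test: it interleaves sendFetches() with invalidTableOrPartitions() a thousand times on a single worker thread and relies on the 30-second future.get() timeout to fail the test if either call blocks, the failure mode referenced in https://github.com/apache/fluss/pull/1666.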
