
[draft] [fix] [broker] Fix messages lost in the geo-replication scenario when deduplication is enabled #20128


Open · wants to merge 6 commits into base: master
@@ -58,6 +58,10 @@ protected boolean replicateEntries(List<Entry> entries) {
brokerService.pulsar().getConfiguration().isEnableReplicatedSubscriptions();

try {
if (!checkNoMessageSkipped(entries)) {
return false;
}

// This flag is set to true when we skip at least one local message,
// in order to skip remaining local messages.
boolean isLocalMessageSkippedOnce = false;
@@ -173,6 +177,7 @@ protected boolean replicateEntries(List<Entry> entries) {
replicatorId, e);
}
log.info("[{}] Resume the data replication after the schema fetching done", replicatorId);
lastSent = PositionImpl.EARLIEST;
cursor.rewind();
fetchSchemaInProgress = false;
readMoreEntries();
@@ -183,6 +188,7 @@ protected boolean replicateEntries(List<Entry> entries) {
msg.getMessageBuilder().clearTxnidLeastBits();
// Increment pending messages for messages produced locally
PENDING_MESSAGES_UPDATER.incrementAndGet(this);
lastSent = entry.getPosition();
Contributor:

The lastSent should be updated after the producer sends it successfully.
We are using the async API to send messages.
It looks like the inflight messages will also be treated as lastSent?

Contributor Author (@poorbarcode, Apr 19, 2023):

> It looks like the inflight messages will also be treated as lastSent?

Yes, it was done on purpose.


Because there is a scenario like this:

  • start sending messages 1~3 to the remote cluster, and it is not finished yet (lastSent is 0 now).
  • (Highlight) receive messages 4~5. These messages will be discarded and trigger a rewind, which reduces the efficiency of the replication task.

If we update the variable lastSent when the sending starts (as this PR does), it works like this:

  • start sending messages 1~3 to the remote cluster, and it is not finished yet (lastSent is 3 now).
  • receive messages 4~5 and send them (lastSent is 5 now).
  • (Highlight) message 3 fails to send; rewind is called (markDeleted is 2 now) and the variable lastSent is set to earliest.
    • Because the timeout of the producer is 0, the probability of this scenario occurring is very, very small.
  • receive message 3 a second time. Because 3 is the next position after max(2, earliest), the check hasMessageSkipped passes; a condensed sketch of this check follows below.
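For clarity, here is a condensed, hypothetical sketch of the continuity check described above. Positions are reduced to plain entry ids and the names only mirror the PR's variables; this is not the actual broker code.

```java
public class ContinuityCheckSketch {
    public static void main(String[] args) {
        long markDeleted = 2;   // messages 1~2 are already acknowledged on the cursor
        long lastSent = -1;     // reset to "earliest" after the failed send of message 3
        long lastProcessed = Math.max(markDeleted, lastSent);

        long firstReceived = 3; // message 3 is redelivered after the rewind
        long expectedFirst = lastProcessed + 1;

        // No message was skipped as long as the first received entry is not beyond
        // the next expected position; otherwise the batch would be discarded and
        // the cursor rewound.
        boolean noMessageSkipped = expectedFirst >= firstReceived;
        System.out.println(noMessageSkipped); // prints "true", so replication continues
    }
}
```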

producer.sendAsync(msg, ProducerSendCallback.create(this, entry, msg));
atLeastOneMessageSentForReplication = true;
}
@@ -42,7 +42,9 @@
import org.apache.bookkeeper.mledger.ManagedLedgerException.CursorAlreadyClosedException;
import org.apache.bookkeeper.mledger.ManagedLedgerException.TooManyRequestsException;
import org.apache.bookkeeper.mledger.Position;
import org.apache.bookkeeper.mledger.impl.ManagedLedgerImpl;
import org.apache.bookkeeper.mledger.impl.PositionImpl;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.pulsar.broker.PulsarServerException;
import org.apache.pulsar.broker.service.AbstractReplicator;
import org.apache.pulsar.broker.service.BrokerService;
@@ -70,6 +72,7 @@ public abstract class PersistentReplicator extends AbstractReplicator

protected final PersistentTopic topic;
protected final ManagedCursor cursor;
protected final ManagedLedgerImpl managedLedger;

protected Optional<DispatchRateLimiter> dispatchRateLimiter = Optional.empty();
private final Object dispatchRateLimiterLock = new Object();
@@ -108,6 +111,8 @@ public abstract class PersistentReplicator extends AbstractReplicator

protected volatile boolean fetchSchemaInProgress = false;

protected volatile Position lastSent = PositionImpl.EARLIEST;

public PersistentReplicator(String localCluster, PersistentTopic localTopic, ManagedCursor cursor,
String remoteCluster, String remoteTopic,
BrokerService brokerService, PulsarClientImpl replicationClient)
@@ -116,6 +121,7 @@ public PersistentReplicator(String localCluster, PersistentTopic localTopic, Man
brokerService, replicationClient);
this.topic = localTopic;
this.cursor = cursor;
this.managedLedger = (ManagedLedgerImpl) localTopic.getManagedLedger();
this.expiryMonitor = new PersistentMessageExpiryMonitor(localTopicName,
Codec.decode(cursor.getName()), cursor, null);
HAVE_PENDING_READ_UPDATER.set(this, FALSE);
@@ -135,6 +141,7 @@ public PersistentReplicator(String localCluster, PersistentTopic localTopic, Man
@Override
protected void readEntries(Producer<byte[]> producer) {
// Rewind the cursor to be sure to read again all non-acked messages sent while restarting
lastSent = PositionImpl.EARLIEST;
cursor.rewind();

cursor.cancelPendingReadRequest();
@@ -268,6 +275,36 @@ protected void readMoreEntries() {
}
}

/**
* Check whether some messages were skipped; if so, the received entries are discarded and rewind is called.
* Why can messages be skipped? For example: if something goes wrong while the Replicator is processing
* messages "[1:1 ~ 3:3]", the Replicator discards the unprocessed messages. But if a new batch of messages
* "[4:1 ~ 6:6]" is received later, those messages would still be sent.
*/
protected boolean checkNoMessageSkipped(List<Entry> entries) {
if (CollectionUtils.isEmpty(entries)){
return true;
}

PositionImpl markDeletedPos = (PositionImpl) cursor.getMarkDeletedPosition();
PositionImpl lastSentPos = (PositionImpl) lastSent;
PositionImpl lastProcessedPos = markDeletedPos.compareTo(lastSentPos) > 0 ? markDeletedPos : lastSentPos;

PositionImpl firstMessageReceived = (PositionImpl) entries.get(0).getPosition();
PositionImpl expectedFirstMessage = managedLedger.getNextValidPosition(lastProcessedPos);
if (expectedFirstMessage.compareTo(firstMessageReceived) >= 0) {
return true;
}
Comment on lines +295 to +297
Contributor:

It's better to change the method name to hasMessageSkipped because we allow duplicated messages.

Contributor Author:

Good suggestion. Already fixed.

Contributor Author:

To make the logic of replicateEntries easier to read, I changed the method name to checkNoMessageSkipped.


log.warn("[{}] Detected skipped messages. first received: {}, expected first: {}",
replicatorId, firstMessageReceived, expectedFirstMessage);
entries.forEach(Entry::release);
cursor.cancelPendingReadRequest();
this.lastSent = PositionImpl.EARLIEST;
cursor.rewind();
return false;
}

@Override
public void readEntriesComplete(List<Entry> entries, Object ctx) {
if (log.isDebugEnabled()) {
@@ -332,6 +369,7 @@ public void sendComplete(Exception exception) {
if (exception != null && !(exception instanceof PulsarClientException.InvalidMessageException)) {
log.error("[{}] Error producing on remote broker", replicator.replicatorId, exception);
// cursor should be rewound since it was incremented when readMoreEntries
replicator.lastSent = PositionImpl.EARLIEST;
replicator.cursor.rewind();
} else {
if (log.isDebugEnabled()) {
@@ -58,6 +58,10 @@ protected boolean replicateEntries(List<Entry> entries) {
boolean atLeastOneMessageSentForReplication = false;

try {
if (!checkNoMessageSkipped(entries)) {
return false;
}

// This flag is set to true when we skip at least one local message,
// in order to skip remaining local messages.
boolean isLocalMessageSkippedOnce = false;
@@ -113,6 +117,7 @@ protected boolean replicateEntries(List<Entry> entries) {

// Increment pending messages for messages produced locally
PENDING_MESSAGES_UPDATER.incrementAndGet(this);
lastSent = entry.getPosition();
Contributor:

Same as the comment in GeoReplicator.

Contributor Author:

Adding context: the linked comment is https://github.com/apache/pulsar/pull/20128/files#r1171223753

Contributor Author (@poorbarcode, Apr 19, 2023):

The reply to this comment is the same as #20128 (comment).

producer.sendAsync(msg, ProducerSendCallback.create(this, entry, msg));
atLeastOneMessageSentForReplication = true;
}
@@ -34,15 +34,18 @@
import io.netty.buffer.ByteBuf;
import java.lang.reflect.Field;
import java.lang.reflect.Method;
import java.nio.charset.Charset;
import java.nio.charset.StandardCharsets;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.Set;
import java.util.SortedSet;
import java.util.TreeSet;
import java.util.UUID;
import java.util.concurrent.ArrayBlockingQueue;
import java.util.concurrent.Callable;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.ConcurrentHashMap;
@@ -51,6 +54,8 @@
import java.util.concurrent.Executors;
import java.util.concurrent.Future;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.function.BiConsumer;
import java.util.stream.Collectors;
import lombok.Cleanup;
import org.apache.bookkeeper.mledger.AsyncCallbacks.DeleteCursorCallback;
@@ -67,6 +72,7 @@
import org.apache.pulsar.broker.BrokerTestUtil;
import org.apache.pulsar.broker.PulsarService;
import org.apache.pulsar.broker.service.BrokerServiceException.NamingException;
import org.apache.pulsar.broker.service.persistent.GeoPersistentReplicator;
import org.apache.pulsar.broker.service.persistent.PersistentReplicator;
import org.apache.pulsar.broker.service.persistent.PersistentTopic;
import org.apache.pulsar.client.admin.PulsarAdmin;
@@ -90,6 +96,7 @@
import org.apache.pulsar.client.impl.PulsarClientImpl;
import org.apache.pulsar.client.impl.conf.ProducerConfigurationData;
import org.apache.pulsar.client.impl.transaction.TransactionImpl;
import org.apache.pulsar.common.api.proto.CommandSubscribe;
import org.apache.pulsar.common.naming.NamespaceName;
import org.apache.pulsar.common.naming.SystemTopicNames;
import org.apache.pulsar.common.naming.TopicName;
@@ -1756,4 +1763,93 @@ public void testReplicatorProducerNotExceed() throws Exception {

Assert.assertThrows(PulsarClientException.ProducerBusyException.class, () -> new MessageProducer(url2, dest2));
}

@Test
public void testDiscontinuousMessages() throws Exception {
Contributor Author (@poorbarcode, Apr 19, 2023):

Hi @codelipenghui

> What kind of exceptions will happen to the producer? IMO, we should use infinite publish timeout, if the exception is not publish timeout, it should not be a retriable exception. We should stop the replication.

My description of the scenario wasn't good; it is not an exception from sending messages. Now there are two scenarios:

  • the schema of the messages is loading, and the Replicator will call rewind in this scenario. See Code-1 below
  • something goes wrong when processing replicateEntries, and the Replicator will not call rewind in this scenario. See Code-2 below

Code-1

https://github.com/apache/pulsar/blob/master/pulsar-broker/src/main/java/org/apache/pulsar/broker/service/persistent/GeoPersistentReplicator.java#L160-L179

Code-2

https://github.com/apache/pulsar/blob/master/pulsar-broker/src/main/java/org/apache/pulsar/broker/service/persistent/GeoPersistentReplicator.java#L190-L192

I opened a comment thread to make it easy to track the context (^_^).

Contributor:

Ok, if we can reach https://github.com/apache/pulsar/blob/master/pulsar-broker/src/main/java/org/apache/pulsar/broker/service/persistent/GeoPersistentReplicator.java#L190-L192, can we just close the replicator and try to restart the replication task?

The main purpose of the PR description is to avoid processing [4,5] before [1,2,3] is processed successfully. It should be a corner case with a very low incidence. If closing the replicator can help with the problem, it will be simpler to implement.

Contributor Author (@poorbarcode, Apr 19, 2023):

@codelipenghui

> Ok, if we can reach https://github.com/apache/pulsar/blob/master/pulsar-broker/src/main/java/org/apache/pulsar/broker/service/persistent/GeoPersistentReplicator.java#L190-L192, can we just close the replicator and try to restart the replication task?

Background: the Replicator currently has some trouble with starting and closing:

  • After closing the internal producer of the Replicator, the Replicator will not work anymore; there is no mechanism to get it running again
    • I will push another PR to fix it.
  • The function disconnect may have a bug that lets the Replicator continue to work after the internal cursor is closed
    • When startProducer and disconnect run concurrently, the disconnect thread may not get the right producer.
    • Maybe something else is wrong. I'm looking into it.
    • I will push another PR to fix it.

So there is not yet a stable way to restart the Replicator (other than unloading the topic).


Summary

Now this PR tries to solve three problems in the same way: make the replicator process messages only sequentially

  • scenario-1: race condition between reading entries and rewind
  • scenario-2: the replication task is aborted by schema loading
  • scenario-3: the replication task is aborted by an unknown error (the one we are discussing)

Since scenario-1 and scenario-2 exist, the solution "make the replicator process messages only sequentially" is needed anyway, so no additional processing is required for scenario-3.

Contributor:

Will the current solution make the replicator unable to re-replicate data (i.e. after resetting the cursor of the replicator) to the remote cluster unless the replicator is restarted?

And will the problem be resolved by unloading the topic if the replicator runs into an exception?

Contributor Author (@poorbarcode, Apr 19, 2023):

@codelipenghui

> Will the current solution make the replicator unable to re-replicate data (i.e. after resetting the cursor of the replicator) to the remote cluster unless the replicator is restarted?

  1. If someone manually moves the Replicator's cursor to a larger position (such as with pulsar-admin topics resetCursor), everything is ok. The check for "whether the messages are continuous or not" is first_message_received <= max(mark_deleted_pos, last_sent_pos) + 1; since resetCursor also moves the variable markDeletePosition to a larger value, the continuity check will return true.
  2. If someone manually moves the Replicator's cursor to a smaller position (such as with rewind or pulsar-admin topics resetCursor), everything is ok.

> And will the problem be resolved by unloading the topic if the replicator runs into an exception?

If something sets the variable lastSent to a wrong value, it can be solved by unloading the topic (see the sketch below).
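For reference, a minimal sketch of the "unload the topic" recovery path via the admin client; the service URL and topic name are placeholders, not taken from this PR.

```java
import org.apache.pulsar.client.admin.PulsarAdmin;

public class UnloadTopicSketch {
    public static void main(String[] args) throws Exception {
        // Unloading the topic closes and re-creates the replicator; when it starts
        // reading again, lastSent is reset back to EARLIEST.
        try (PulsarAdmin admin = PulsarAdmin.builder()
                .serviceHttpUrl("http://localhost:8080")
                .build()) {
            admin.topics().unload("persistent://pulsar/ns1/my-topic");
        }
    }
}
```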

Contributor:

Ok, this approach looks easier to understand and more straightforward.
It's very similar to Pulsar connectors, like a connector that consumes messages from one topic and publishes them to another topic. I mean, if we want to introduce a principle for handling such issues, I don't think we want to add logic that checks whether messages have been skipped. This is why I think we should not introduce such logic here.

Contributor Author:

@codelipenghui

I see:

For scenario-2 (the replication task is aborted by schema loading):

| time | receive messages | async load schema |
| --- | --- | --- |
| 1 | receive messages 1~3 | |
| 2 | | async load schema if needed |
| 3 | receive messages 4~5 | |
| 4 | send messages 4~5 to the remote cluster | |
| 5 | | load schema success, rewind cursor to position 1 |
| 6 | (Highlight) receive messages 1~3 again; the sends will fail the deduplication check | |

This scenario is hard to fix, because there is no clear marker of which in-flight reads need to be discarded after step 2. I think I should learn how the connector handles messages.

Contributor Author:

> This scenario is hard to fix, because there is no clear marker of which in-flight reads need to be discarded after step 2. I think I should learn how the connector handles messages.

I see. We can continue to handle these messages after the schema loading is finished.

Contributor Author:

@codelipenghui I think this suggestion is good. Thanks. I will try to solve the issues described above with multiple PRs.

Contributor:

> This scenario is hard to fix, because there is no clear marker of which in-flight reads need to be discarded after step 2. I think I should learn how the connector handles messages.

But we will not get an error if the message is duplicated, right? The broker skips the duplicated sends and returns (-1, -1) as the message ID. We are safe to publish messages 1 to 5 again.
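A hypothetical client-side sketch of the deduplication behaviour described in this comment: with deduplication enabled, re-sending an already-persisted sequence id is acknowledged without an error. The URLs, topic, and producer name are placeholders.

```java
import org.apache.pulsar.client.api.MessageId;
import org.apache.pulsar.client.api.Producer;
import org.apache.pulsar.client.api.PulsarClient;
import org.apache.pulsar.client.api.Schema;

public class DedupResendSketch {
    public static void main(String[] args) throws Exception {
        // Assumes deduplication is already enabled on the topic or namespace.
        try (PulsarClient client = PulsarClient.builder()
                .serviceUrl("pulsar://localhost:6650")
                .build();
             Producer<String> producer = client.newProducer(Schema.STRING)
                     .topic("persistent://pulsar/ns1/my-topic")
                     .producerName("dedup-sketch")
                     .create()) {
            MessageId first = producer.newMessage().sequenceId(1).value("m1").send();
            // Re-sending the same sequence id is not treated as an error: the broker
            // skips persisting it and acknowledges the send (the comment above notes
            // the returned message id is (-1, -1) in that case).
            MessageId resent = producer.newMessage().sequenceId(1).value("m1").send();
            System.out.println(first + " / " + resent);
        }
    }
}
```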

final Field fieldReadPosition = ManagedCursorImpl.class.getDeclaredField("readPosition");
fieldReadPosition.setAccessible(true);
final Field fieldPendingMessages = PersistentReplicator.class.getDeclaredField("pendingMessages");
fieldPendingMessages.setAccessible(true);
final String namespace = "pulsar/ns1";
final TopicName tName = TopicName.get(BrokerTestUtil.newUniqueName("persistent://" + namespace + "/tp_"));
final String tpName = tName.toString();
final String ignoredSubName = "sub_ignore";
final String replicatorSubName = "pulsar.repl.r2";

// create topics.
admin1.topics().createNonPartitionedTopic(tpName);
admin1.topics().createSubscription(tpName, ignoredSubName, MessageId.earliest);
admin1.topicPolicies().setDeduplicationStatus(tpName, true);
try {
admin2.topics().createNonPartitionedTopic(tpName);
} catch (Exception ex){/* Maybe ConflictException: because replicator will create this topic too.*/}
admin2.topics().createSubscription(tpName, ignoredSubName, MessageId.earliest);
admin2.schemas().createSchema(tpName, Schema.STRING.getSchemaInfo());
admin2.topicPolicies().setDeduplicationStatus(tpName, true);

// init clients.
final PulsarClient client1 = PulsarClient.builder().serviceUrl(url1.toString()).build();
final PulsarClient client2 = PulsarClient.builder().serviceUrl(url2.toString()).build();
final Producer producer1 = client1.newProducer().topic(tpName).enableBatching(false).create();
final Consumer consumer2 = client2.newConsumer().topic(tpName).subscriptionName(ignoredSubName).subscribe();
final PersistentTopic tp =
(PersistentTopic) pulsar1.getBrokerService().getTopic(tName.toString(), false).join().get();
final ManagedLedgerImpl ml = (ManagedLedgerImpl) tp.getManagedLedger();
final ManagedCursorImpl replicatorCursor = (ManagedCursorImpl) ml.openCursor(replicatorSubName,
CommandSubscribe.InitialPosition.Earliest);
tp.checkReplication().join();
final GeoPersistentReplicator replicator = (GeoPersistentReplicator) tp.getReplicators().values().get(0);

// pause replication.
fieldPendingMessages.set(replicator, Integer.MAX_VALUE);
// sleep some seconds to skip the first reading.
Thread.sleep(2000);

// Set a wrong read position to mock discontinuous read.
BiConsumer<MessageId, Throwable> actionToMakeReadPositionError = (messageId, ex) -> {
MessageIdImpl messageIdImpl = (MessageIdImpl) messageId;
PositionImpl wrongReadPosition =
PositionImpl.get(messageIdImpl.getLedgerId(), messageIdImpl.getEntryId());
Position originalPos = replicatorCursor.getReadPosition();
try {
fieldReadPosition.set(replicatorCursor, wrongReadPosition);
} catch (IllegalAccessException e) {
}
log.info("original read-pos: {}, set wrong pos: {}", originalPos,
replicatorCursor.getReadPosition());
};

// Send messages.
final int sentCount = 200;
for (int i = 0; i < sentCount; i++){
CompletableFuture<MessageId> sendFuture =
producer1.sendAsync(Integer.valueOf(i).toString().getBytes(Charset.defaultCharset()));
if (i % 10 == 0 && i > 10) {
sendFuture.whenComplete(actionToMakeReadPositionError);
}
}

// Start replication.
fieldPendingMessages.set(replicator, 0);
replicator.readEntriesComplete(Collections.emptyList(), null);

// Receive replicated messages.
final AtomicInteger receivedCounter = new AtomicInteger();
final ArrayBlockingQueue<Integer> receivedMessages = new ArrayBlockingQueue<>(sentCount);
// 60s is set only to avoid flaky test, which is slow to run locally.
Awaitility.await().atMost(60, TimeUnit.SECONDS).untilAsserted(() -> {
Message<byte[]> msg = consumer2.receive(2, TimeUnit.SECONDS);
if (msg != null) {
String receivedMsg = new String(msg.getValue(), Charset.defaultCharset());
log.info("received: {}", receivedMsg);
receivedMessages.add(Integer.valueOf(receivedMsg));
receivedCounter.incrementAndGet();
}
assertEquals(receivedCounter.get(), sentCount);
});

// Verify the order in which messages are received.
ArrayList<Integer> sortedReceivedMessages = new ArrayList<>(receivedMessages);
Collections.sort(sortedReceivedMessages);
assertEquals(receivedMessages, sortedReceivedMessages);
}
}