Skip to content

Commit

Permalink
Revert "[server] Race condition fix for re-subscription of real-time …
Browse files Browse the repository at this point in the history
…topic partitions. (#1192)" (#1221)

This reverts commit 06cc1fc.
  • Loading branch information
gaojieliu authored Oct 7, 2024
1 parent 5889f63 commit 001f7a9
Show file tree
Hide file tree
Showing 4 changed files with 33 additions and 214 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -250,8 +250,8 @@ void setDataReceiver(
// Defensive coding. Should never happen except in case of a regression.
throw new IllegalStateException(
"It is not allowed to set multiple " + ConsumedDataReceiver.class.getSimpleName() + " instances for the same "
+ "topic-partition of a given consumer. Previous: " + previousConsumedDataReceiver.destinationIdentifier()
+ ", New: " + consumedDataReceiver.destinationIdentifier());
+ "topic-partition of a given consumer. Previous: " + previousConsumedDataReceiver + ", New: "
+ consumedDataReceiver);
}
synchronized (this) {
notifyAll();
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -222,14 +222,8 @@ public void unsubscribeAll(PubSubTopic versionTopic) {
versionTopicToTopicPartitionToConsumer.compute(versionTopic, (k, topicPartitionToConsumerMap) -> {
if (topicPartitionToConsumerMap != null) {
topicPartitionToConsumerMap.forEach((topicPartition, sharedConsumer) -> {
/**
* Refer {@link KafkaConsumerService#startConsumptionIntoDataReceiver} for avoiding race condition caused by
* setting data receiver and unsubscribing concurrently for the same topic partition on a shared consumer.
*/
synchronized (sharedConsumer) {
sharedConsumer.unSubscribe(topicPartition);
removeTopicPartitionFromConsumptionTask(sharedConsumer, topicPartition);
}
sharedConsumer.unSubscribe(topicPartition);
removeTopicPartitionFromConsumptionTask(sharedConsumer, topicPartition);
});
}
return null;
Expand All @@ -243,14 +237,8 @@ public void unsubscribeAll(PubSubTopic versionTopic) {
public void unSubscribe(PubSubTopic versionTopic, PubSubTopicPartition pubSubTopicPartition) {
PubSubConsumerAdapter consumer = getConsumerAssignedToVersionTopicPartition(versionTopic, pubSubTopicPartition);
if (consumer != null) {
/**
* Refer {@link KafkaConsumerService#startConsumptionIntoDataReceiver} for avoiding race condition caused by
* setting data receiver and unsubscribing concurrently for the same topic partition on a shared consumer.
*/
synchronized (consumer) {
consumer.unSubscribe(pubSubTopicPartition);
removeTopicPartitionFromConsumptionTask(consumer, pubSubTopicPartition);
}
consumer.unSubscribe(pubSubTopicPartition);
consumerToConsumptionTask.get(consumer).removeDataReceiver(pubSubTopicPartition);
versionTopicToTopicPartitionToConsumer.compute(versionTopic, (k, topicPartitionToConsumerMap) -> {
if (topicPartitionToConsumerMap != null) {
topicPartitionToConsumerMap.remove(pubSubTopicPartition);
Expand All @@ -277,25 +265,20 @@ public void batchUnsubscribe(PubSubTopic versionTopic, Set<PubSubTopicPartition>
/**
* Leverage {@link PubSubConsumerAdapter#batchUnsubscribe(Set)}.
*/
consumerUnSubTopicPartitionSet.forEach((sharedConsumer, tpSet) -> {
ConsumptionTask task = consumerToConsumptionTask.get(sharedConsumer);
/**
* Refer {@link KafkaConsumerService#startConsumptionIntoDataReceiver} for avoiding race condition caused by
* setting data receiver and unsubscribing concurrently for the same topic partition on a shared consumer.
*/
synchronized (sharedConsumer) {
sharedConsumer.batchUnsubscribe(tpSet);
tpSet.forEach(task::removeDataReceiver);
}
tpSet.forEach(
tp -> versionTopicToTopicPartitionToConsumer.compute(versionTopic, (k, topicPartitionToConsumerMap) -> {
if (topicPartitionToConsumerMap != null) {
topicPartitionToConsumerMap.remove(tp);
return topicPartitionToConsumerMap.isEmpty() ? null : topicPartitionToConsumerMap;
} else {
return null;
}
}));
consumerUnSubTopicPartitionSet.forEach((c, tpSet) -> {
c.batchUnsubscribe(tpSet);
ConsumptionTask task = consumerToConsumptionTask.get(c);
tpSet.forEach(tp -> {
task.removeDataReceiver(tp);
versionTopicToTopicPartitionToConsumer.compute(versionTopic, (k, topicPartitionToConsumerMap) -> {
if (topicPartitionToConsumerMap != null) {
topicPartitionToConsumerMap.remove(tp);
return topicPartitionToConsumerMap.isEmpty() ? null : topicPartitionToConsumerMap;
} else {
return null;
}
});
});
});
}

Expand Down Expand Up @@ -404,32 +387,26 @@ public void startConsumptionIntoDataReceiver(
PubSubTopic versionTopic = consumedDataReceiver.destinationIdentifier();
PubSubTopicPartition topicPartition = partitionReplicaIngestionContext.getPubSubTopicPartition();
SharedKafkaConsumer consumer = assignConsumerFor(versionTopic, topicPartition);

if (consumer == null) {
// Defensive code. Shouldn't happen except in case of a regression.
throw new VeniceException(
"Shared consumer must exist for version topic: " + versionTopic + " in Kafka cluster: " + kafkaUrl);
}

ConsumptionTask consumptionTask = consumerToConsumptionTask.get(consumer);
if (consumptionTask == null) {
// Defensive coding. Should never happen except in case of a regression.
throw new IllegalStateException(
"There should be a " + ConsumptionTask.class.getSimpleName() + " assigned for this "
+ SharedKafkaConsumer.class.getSimpleName());
}
/**
* It is possible that when one {@link StoreIngestionTask} thread finishes unsubscribing a topic partition but not
* finish removing data receiver, but the other {@link StoreIngestionTask} thread is setting data receiver for this
* topic partition before subscription. As {@link ConsumptionTask} does not allow 2 different data receivers for
* the same topic partition, it will throw exception.
* N.B. it's important to set the {@link ConsumedDataReceiver} prior to subscribing, otherwise the
* {@link KafkaConsumerService.ConsumptionTask} will not be able to funnel the messages.
*/
synchronized (consumer) {
ConsumptionTask consumptionTask = consumerToConsumptionTask.get(consumer);
if (consumptionTask == null) {
// Defensive coding. Should never happen except in case of a regression.
throw new IllegalStateException(
"There should be a " + ConsumptionTask.class.getSimpleName() + " assigned for this "
+ SharedKafkaConsumer.class.getSimpleName());
}
/**
* N.B. it's important to set the {@link ConsumedDataReceiver} prior to subscribing, otherwise the
* {@link KafkaConsumerService.ConsumptionTask} will not be able to funnel the messages.
*/
consumptionTask.setDataReceiver(topicPartition, consumedDataReceiver);
consumer.subscribe(consumedDataReceiver.destinationIdentifier(), topicPartition, lastReadOffset);
}
consumptionTask.setDataReceiver(topicPartition, consumedDataReceiver);
consumer.subscribe(consumedDataReceiver.destinationIdentifier(), topicPartition, lastReadOffset);
}

interface KCSConstructor {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -348,9 +348,4 @@ public Long endOffset(PubSubTopicPartition pubSubTopicPartition) {
public List<PubSubTopicPartitionInfo> partitionsFor(PubSubTopic topic) {
throw new UnsupportedOperationException("partitionsFor is not supported in SharedKafkaConsumer");
}

// Test only
public void setNextPollTimeOutSeconds(long seconds) {
this.nextPollTimeOutSeconds = seconds;
}
}
Original file line number Diff line number Diff line change
@@ -1,51 +1,28 @@
package com.linkedin.davinci.kafka.consumer;

import static com.linkedin.venice.ConfigKeys.KAFKA_BOOTSTRAP_SERVERS;
import static org.mockito.ArgumentMatchers.any;
import static org.mockito.ArgumentMatchers.anyBoolean;
import static org.mockito.ArgumentMatchers.anyString;
import static org.mockito.Mockito.doReturn;
import static org.mockito.Mockito.mock;
import static org.mockito.Mockito.never;
import static org.mockito.Mockito.reset;
import static org.mockito.Mockito.verify;
import static org.mockito.Mockito.when;
import static org.testng.Assert.assertFalse;
import static org.testng.Assert.assertTrue;

import com.linkedin.davinci.config.VeniceServerConfig;
import com.linkedin.davinci.ingestion.consumption.ConsumedDataReceiver;
import com.linkedin.venice.kafka.protocol.KafkaMessageEnvelope;
import com.linkedin.venice.meta.ReadOnlyStoreRepository;
import com.linkedin.venice.meta.Version;
import com.linkedin.venice.pubsub.PubSubConsumerAdapterFactory;
import com.linkedin.venice.pubsub.PubSubTopicPartitionImpl;
import com.linkedin.venice.pubsub.PubSubTopicRepository;
import com.linkedin.venice.pubsub.adapter.kafka.consumer.ApacheKafkaConsumerAdapter;
import com.linkedin.venice.pubsub.api.PubSubMessageDeserializer;
import com.linkedin.venice.pubsub.api.PubSubTopic;
import com.linkedin.venice.pubsub.api.PubSubTopicPartition;
import com.linkedin.venice.serialization.avro.OptimizedKafkaValueSerializer;
import com.linkedin.venice.utils.SystemTime;
import com.linkedin.venice.utils.Utils;
import com.linkedin.venice.utils.pools.LandFillObjectPool;
import io.tehuti.metrics.MetricsRepository;
import io.tehuti.metrics.Sensor;
import java.lang.reflect.InvocationTargetException;
import java.lang.reflect.Method;
import java.util.ArrayList;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Properties;
import java.util.Set;
import java.util.concurrent.CountDownLatch;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.function.Function;
import org.testng.Assert;
import org.testng.annotations.DataProvider;
import org.testng.annotations.Test;

Expand Down Expand Up @@ -481,134 +458,4 @@ private void verifyConsumerServiceStartConsumptionIntoDataReceiver(
partitionReplicaIngestionContext.getVersionTopic(),
partitionReplicaIngestionContext.getPubSubTopicPartition());
}

/**
* This test is to simulate multiple threads resubscribing to the same real-time topic partition for different store
* versions and verify if the lock will protect the handoff for {@link ConsumptionTask} and {@link ConsumedDataReceiver}
* during the re-subscription.
*/
@Test
public void testKafkaConsumerServiceResubscriptionConcurrency() throws Exception {
ApacheKafkaConsumerAdapter consumer1 = mock(ApacheKafkaConsumerAdapter.class);
when(consumer1.hasAnySubscription()).thenReturn(true);

PubSubConsumerAdapterFactory factory = mock(PubSubConsumerAdapterFactory.class);
when(factory.create(any(), anyBoolean(), any(), any())).thenReturn(consumer1);

Properties properties = new Properties();
String testKafkaUrl = "test_kafka_url";
properties.put(KAFKA_BOOTSTRAP_SERVERS, testKafkaUrl);
MetricsRepository mockMetricsRepository = mock(MetricsRepository.class);
final Sensor mockSensor = mock(Sensor.class);
doReturn(mockSensor).when(mockMetricsRepository).sensor(anyString(), any());

int versionNum = 5;

PubSubMessageDeserializer pubSubDeserializer = new PubSubMessageDeserializer(
new OptimizedKafkaValueSerializer(),
new LandFillObjectPool<>(KafkaMessageEnvelope::new),
new LandFillObjectPool<>(KafkaMessageEnvelope::new));
KafkaConsumerService consumerService = new PartitionWiseKafkaConsumerService(
ConsumerPoolType.REGULAR_POOL,
factory,
properties,
1000l,
versionNum + 1, // Plus 1 to guarantee the consumer pool size is larger than the # of versions.
mock(IngestionThrottler.class),
mock(KafkaClusterBasedRecordThrottler.class),
mockMetricsRepository,
"test_kafka_cluster_alias",
TimeUnit.MINUTES.toMillis(1),
mock(TopicExistenceChecker.class),
false,
pubSubDeserializer,
SystemTime.INSTANCE,
null,
false,
mock(ReadOnlyStoreRepository.class),
false);
String storeName = Utils.getUniqueString("test_consumer_service");

Function<String, Boolean> isAAWCStoreFunc = vt -> true;
KafkaConsumerServiceDelegator.KafkaConsumerServiceBuilder consumerServiceBuilder =
(ignored, poolType) -> consumerService;
VeniceServerConfig mockConfig = mock(VeniceServerConfig.class);
doReturn(false).when(mockConfig).isDedicatedConsumerPoolForAAWCLeaderEnabled();
doReturn(true).when(mockConfig).isResubscriptionTriggeredByVersionIngestionContextChangeEnabled();
doReturn(KafkaConsumerServiceDelegator.ConsumerPoolStrategyType.CURRENT_VERSION_PRIORITIZATION).when(mockConfig)
.getConsumerPoolStrategyType();
KafkaConsumerServiceDelegator delegator =
new KafkaConsumerServiceDelegator(mockConfig, consumerServiceBuilder, isAAWCStoreFunc);
PubSubTopicPartition realTimeTopicPartition =
new PubSubTopicPartitionImpl(TOPIC_REPOSITORY.getTopic(Version.composeRealTimeTopic(storeName)), 0);

CountDownLatch countDownLatch = new CountDownLatch(1);
List<Thread> infiniteSubUnSubThreads = new ArrayList<>();
for (int i = 0; i < versionNum; i++) {
PubSubTopic topicV1ForStoreName3 = TOPIC_REPOSITORY.getTopic(Version.composeKafkaTopic(storeName, i));
StoreIngestionTask task = mock(StoreIngestionTask.class);
when(task.getVersionTopic()).thenReturn(topicV1ForStoreName3);
when(task.isHybridMode()).thenReturn(true);
PubSubTopic versionTopicV1 = task.getVersionTopic();

PartitionReplicaIngestionContext partitionReplicaIngestionContext = new PartitionReplicaIngestionContext(
versionTopicV1,
realTimeTopicPartition,
PartitionReplicaIngestionContext.VersionRole.CURRENT,
PartitionReplicaIngestionContext.WorkloadType.AA_OR_WRITE_COMPUTE);
ConsumedDataReceiver consumedDataReceiver = mock(ConsumedDataReceiver.class);
when(consumedDataReceiver.destinationIdentifier()).thenReturn(versionTopicV1);
Runnable infiniteSubUnSub = getResubscriptionRunnableFor(
delegator,
partitionReplicaIngestionContext,
consumedDataReceiver,
countDownLatch);
Thread infiniteSubUnSubThread = new Thread(infiniteSubUnSub, "infiniteResubscribe: " + topicV1ForStoreName3);
infiniteSubUnSubThread.start();
infiniteSubUnSubThreads.add(infiniteSubUnSubThread);
}

long currentTime = System.currentTimeMillis();
Boolean raceConditionFound = countDownLatch.await(30, TimeUnit.SECONDS);
long elapsedTime = System.currentTimeMillis() - currentTime;
for (Thread infiniteSubUnSubThread: infiniteSubUnSubThreads) {
infiniteSubUnSubThread.stop();
}
Assert.assertFalse(
raceConditionFound,
"Found race condition in KafkaConsumerService with time passed in milliseconds: " + elapsedTime);
}

private Runnable getResubscriptionRunnableFor(
KafkaConsumerServiceDelegator consumerServiceDelegator,
PartitionReplicaIngestionContext partitionReplicaIngestionContext,
ConsumedDataReceiver consumedDataReceiver,
CountDownLatch countDownLatch) {
PubSubTopic versionTopic = partitionReplicaIngestionContext.getVersionTopic();
PubSubTopicPartition pubSubTopicPartition = partitionReplicaIngestionContext.getPubSubTopicPartition();
return () -> {
try {
while (true) {
consumerServiceDelegator
.startConsumptionIntoDataReceiver(partitionReplicaIngestionContext, 0, consumedDataReceiver);
// Avoid wait time here to increase the chance for race condition.
consumerServiceDelegator.assignConsumerFor(versionTopic, pubSubTopicPartition).setNextPollTimeOutSeconds(0);
int versionNum =
Version.parseVersionFromKafkaTopicName(partitionReplicaIngestionContext.getVersionTopic().getName());
if (versionNum % 3 == 0) {
consumerServiceDelegator.unSubscribe(versionTopic, pubSubTopicPartition);
} else if (versionNum % 3 == 1) {
consumerServiceDelegator.unsubscribeAll(partitionReplicaIngestionContext.getVersionTopic());
} else {
consumerServiceDelegator.batchUnsubscribe(
partitionReplicaIngestionContext.getVersionTopic(),
Collections.singleton(partitionReplicaIngestionContext.getPubSubTopicPartition()));
}
}
} catch (Exception e) {
e.printStackTrace();
countDownLatch.countDown();
}
};
}
}

0 comments on commit 001f7a9

Please sign in to comment.