2 * Copyright (c) 2014, 2015 Cisco Systems, Inc. and others. All rights reserved.
4 * This program and the accompanying materials are made available under the
5 * terms of the Eclipse Public License v1.0 which accompanies this distribution,
6 * and is available at http://www.eclipse.org/legal/epl-v10.html
8 package org.opendaylight.controller.cluster.datastore.shardmanager;
10 import static org.awaitility.Awaitility.await;
11 import static org.junit.Assert.assertEquals;
12 import static org.junit.Assert.assertFalse;
13 import static org.junit.Assert.assertNotNull;
14 import static org.junit.Assert.assertNull;
15 import static org.junit.Assert.assertSame;
16 import static org.junit.Assert.assertTrue;
17 import static org.junit.Assert.fail;
18 import static org.mockito.ArgumentMatchers.anyString;
19 import static org.mockito.Mockito.doReturn;
20 import static org.mockito.Mockito.mock;
21 import static org.mockito.Mockito.reset;
22 import static org.mockito.Mockito.timeout;
23 import static org.mockito.Mockito.verify;
24 import static org.mockito.Mockito.verifyNoMoreInteractions;
26 import akka.actor.ActorRef;
27 import akka.actor.ActorSystem;
28 import akka.actor.AddressFromURIString;
29 import akka.actor.PoisonPill;
30 import akka.actor.Props;
31 import akka.actor.Status;
32 import akka.actor.Status.Failure;
33 import akka.actor.Status.Success;
34 import akka.cluster.Cluster;
35 import akka.cluster.ClusterEvent;
36 import akka.cluster.Member;
37 import akka.dispatch.Dispatchers;
38 import akka.dispatch.OnComplete;
39 import akka.japi.Creator;
40 import akka.pattern.Patterns;
41 import akka.persistence.RecoveryCompleted;
42 import akka.serialization.Serialization;
43 import akka.testkit.TestActorRef;
44 import akka.testkit.javadsl.TestKit;
45 import akka.util.Timeout;
46 import com.google.common.base.Stopwatch;
47 import com.google.common.collect.ImmutableMap;
48 import com.google.common.collect.Lists;
49 import com.google.common.collect.Sets;
50 import com.google.common.util.concurrent.SettableFuture;
51 import com.google.common.util.concurrent.Uninterruptibles;
52 import java.time.Duration;
53 import java.util.AbstractMap;
54 import java.util.Arrays;
55 import java.util.Collection;
56 import java.util.Collections;
57 import java.util.HashMap;
58 import java.util.List;
60 import java.util.Map.Entry;
62 import java.util.concurrent.CountDownLatch;
63 import java.util.concurrent.TimeUnit;
64 import java.util.concurrent.TimeoutException;
65 import java.util.function.Consumer;
66 import java.util.function.Function;
67 import java.util.stream.Collectors;
68 import org.junit.After;
69 import org.junit.AfterClass;
70 import org.junit.Before;
71 import org.junit.BeforeClass;
72 import org.junit.Test;
73 import org.junit.runner.RunWith;
74 import org.mockito.junit.MockitoJUnitRunner;
75 import org.opendaylight.controller.cluster.access.concepts.MemberName;
76 import org.opendaylight.controller.cluster.datastore.AbstractClusterRefActorTest;
77 import org.opendaylight.controller.cluster.datastore.ClusterWrapperImpl;
78 import org.opendaylight.controller.cluster.datastore.DataStoreVersions;
79 import org.opendaylight.controller.cluster.datastore.DatastoreContext;
80 import org.opendaylight.controller.cluster.datastore.DatastoreContextFactory;
81 import org.opendaylight.controller.cluster.datastore.DistributedDataStore;
82 import org.opendaylight.controller.cluster.datastore.Shard;
83 import org.opendaylight.controller.cluster.datastore.config.Configuration;
84 import org.opendaylight.controller.cluster.datastore.config.ConfigurationImpl;
85 import org.opendaylight.controller.cluster.datastore.config.EmptyModuleShardConfigProvider;
86 import org.opendaylight.controller.cluster.datastore.config.ModuleShardConfiguration;
87 import org.opendaylight.controller.cluster.datastore.exceptions.AlreadyExistsException;
88 import org.opendaylight.controller.cluster.datastore.exceptions.NoShardLeaderException;
89 import org.opendaylight.controller.cluster.datastore.exceptions.NotInitializedException;
90 import org.opendaylight.controller.cluster.datastore.exceptions.PrimaryNotFoundException;
91 import org.opendaylight.controller.cluster.datastore.identifiers.ShardIdentifier;
92 import org.opendaylight.controller.cluster.datastore.identifiers.ShardManagerIdentifier;
93 import org.opendaylight.controller.cluster.datastore.messages.ActorInitialized;
94 import org.opendaylight.controller.cluster.datastore.messages.AddShardReplica;
95 import org.opendaylight.controller.cluster.datastore.messages.ChangeShardMembersVotingStatus;
96 import org.opendaylight.controller.cluster.datastore.messages.CreateShard;
97 import org.opendaylight.controller.cluster.datastore.messages.FindLocalShard;
98 import org.opendaylight.controller.cluster.datastore.messages.FindPrimary;
99 import org.opendaylight.controller.cluster.datastore.messages.LocalPrimaryShardFound;
100 import org.opendaylight.controller.cluster.datastore.messages.LocalShardFound;
101 import org.opendaylight.controller.cluster.datastore.messages.LocalShardNotFound;
102 import org.opendaylight.controller.cluster.datastore.messages.PrimaryShardInfo;
103 import org.opendaylight.controller.cluster.datastore.messages.RemotePrimaryShardFound;
104 import org.opendaylight.controller.cluster.datastore.messages.RemoveShardReplica;
105 import org.opendaylight.controller.cluster.datastore.messages.ShardLeaderStateChanged;
106 import org.opendaylight.controller.cluster.datastore.messages.UpdateSchemaContext;
107 import org.opendaylight.controller.cluster.datastore.persisted.DatastoreSnapshot;
108 import org.opendaylight.controller.cluster.datastore.persisted.DatastoreSnapshot.ShardSnapshot;
109 import org.opendaylight.controller.cluster.datastore.persisted.ShardManagerSnapshot;
110 import org.opendaylight.controller.cluster.datastore.utils.ForwardingActor;
111 import org.opendaylight.controller.cluster.datastore.utils.MockClusterWrapper;
112 import org.opendaylight.controller.cluster.datastore.utils.MockConfiguration;
113 import org.opendaylight.controller.cluster.datastore.utils.PrimaryShardInfoFutureCache;
114 import org.opendaylight.controller.cluster.notifications.LeaderStateChanged;
115 import org.opendaylight.controller.cluster.notifications.RegisterRoleChangeListener;
116 import org.opendaylight.controller.cluster.notifications.RoleChangeNotification;
117 import org.opendaylight.controller.cluster.raft.RaftState;
118 import org.opendaylight.controller.cluster.raft.TestActorFactory;
119 import org.opendaylight.controller.cluster.raft.base.messages.FollowerInitialSyncUpStatus;
120 import org.opendaylight.controller.cluster.raft.base.messages.SwitchBehavior;
121 import org.opendaylight.controller.cluster.raft.client.messages.GetSnapshot;
122 import org.opendaylight.controller.cluster.raft.client.messages.Shutdown;
123 import org.opendaylight.controller.cluster.raft.messages.AddServer;
124 import org.opendaylight.controller.cluster.raft.messages.AddServerReply;
125 import org.opendaylight.controller.cluster.raft.messages.ChangeServersVotingStatus;
126 import org.opendaylight.controller.cluster.raft.messages.RemoveServer;
127 import org.opendaylight.controller.cluster.raft.messages.RemoveServerReply;
128 import org.opendaylight.controller.cluster.raft.messages.ServerChangeReply;
129 import org.opendaylight.controller.cluster.raft.messages.ServerChangeStatus;
130 import org.opendaylight.controller.cluster.raft.messages.ServerRemoved;
131 import org.opendaylight.controller.cluster.raft.policy.DisableElectionsRaftPolicy;
132 import org.opendaylight.controller.cluster.raft.utils.InMemoryJournal;
133 import org.opendaylight.controller.cluster.raft.utils.InMemorySnapshotStore;
134 import org.opendaylight.controller.cluster.raft.utils.MessageCollectorActor;
135 import org.opendaylight.controller.md.cluster.datastore.model.TestModel;
136 import org.opendaylight.yangtools.concepts.Registration;
137 import org.opendaylight.yangtools.yang.common.XMLNamespace;
138 import org.opendaylight.yangtools.yang.data.api.schema.tree.DataTree;
139 import org.opendaylight.yangtools.yang.model.api.EffectiveModelContext;
140 import org.slf4j.Logger;
141 import org.slf4j.LoggerFactory;
142 import scala.concurrent.Await;
143 import scala.concurrent.Future;
144 import scala.concurrent.duration.FiniteDuration;
// Tests for the shard manager actor, run with Mockito's strict-stubs JUnit runner.
146 @RunWith(MockitoJUnitRunner.StrictStubs.class)
147 public class ShardManagerTest extends AbstractClusterRefActorTest {
148 private static final Logger LOG = LoggerFactory.getLogger(ShardManagerTest.class);
// Member names used when building shard identifiers and configurations.
149 private static final MemberName MEMBER_1 = MemberName.forName("member-1");
150 private static final MemberName MEMBER_2 = MemberName.forName("member-2");
151 private static final MemberName MEMBER_3 = MemberName.forName("member-3");
// Counter consumed by the shardMrgIDSuffix initializer below, so every test instance gets a distinct suffix.
// NOTE(review): mutable static despite the constant-style name.
153 private static int ID_COUNTER = 1;
// Created in setUp() when null and reset to null in tearDown().
154 private static ActorRef mockShardActor;
155 private static ShardIdentifier mockShardName;
// Re-created in setUp(); passed as the readiness future in newShardMgrProps(Configuration).
156 private static SettableFuture<Void> ready;
// Assigned in beforeClass() and cleared in afterClass().
157 private static EffectiveModelContext TEST_SCHEMA_CONTEXT;
// Per-instance suffix "config<N>"; used as datastore name and as the shard manager identifier type.
// NOTE(review): "Mrg" looks like a transposition of "Mgr" (compare shardMgrID) - the name is used throughout the file.
159 private final String shardMrgIDSuffix = "config" + ID_COUNTER++;
160 private final TestActorFactory actorFactory = new TestActorFactory(getSystem());
// Base datastore settings shared by the builders below: 600 ms shard initialization timeout,
// 100 ms heartbeat interval and an election timeout factor of 6.
161 private final DatastoreContext.Builder datastoreContextBuilder = DatastoreContext.newBuilder()
162 .dataStoreName(shardMrgIDSuffix).shardInitializationTimeout(600, TimeUnit.MILLISECONDS)
163 .shardHeartbeatIntervalInMillis(100).shardElectionTimeoutFactor(6);
// String form of the shard manager identifier built from the per-instance suffix.
165 private final String shardMgrID = ShardManagerIdentifier.builder().type(shardMrgIDSuffix).build().toString();
// Assigns the class-wide TEST_SCHEMA_CONTEXT from TestModel.createTestContext().
// NOTE(review): the line numbered 167 (presumably the @BeforeClass annotation) is not visible here - confirm.
168 public static void beforeClass() {
169 TEST_SCHEMA_CONTEXT = TestModel.createTestContext();
// Drops the reference to the shared schema context.
// NOTE(review): the line numbered 172 (presumably the @AfterClass annotation) is not visible here - confirm.
173 public static void afterClass() {
174 TEST_SCHEMA_CONTEXT = null;
// Resets shared state: a fresh readiness future and empty in-memory journal and snapshot store.
// NOTE(review): the lines numbered 177 and 187-188 are not visible here, so the annotation and the
// exact extent of the if-block below cannot be confirmed from this view.
178 public void setUp() {
179 ready = SettableFuture.create();
181 InMemoryJournal.clear();
182 InMemorySnapshotStore.clear();
// Create the mock shard actor only when none exists; it is a MessageCollectorActor named after
// the member-1 default shard identifier of type "config".
184 if (mockShardActor == null) {
185 mockShardName = ShardIdentifier.create(Shard.DEFAULT_NAME, MEMBER_1, "config");
186 mockShardActor = getSystem().actorOf(MessageCollectorActor.props(), mockShardName.toString());
// Discard anything the collector recorded previously.
189 MessageCollectorActor.clearMessages(mockShardActor);
// Clears the in-memory journal and snapshot store, stops the mock shard actor and closes the actor factory.
193 public void tearDown() {
194 InMemoryJournal.clear();
195 InMemorySnapshotStore.clear();
// Stop the mock shard actor and wait up to 10 seconds for it to terminate before dropping the
// reference, so that setUp() creates a new one.
197 mockShardActor.tell(PoisonPill.getInstance(), ActorRef.noSender());
198 await().atMost(Duration.ofSeconds(10)).until(mockShardActor::isTerminated);
199 mockShardActor = null;
201 actorFactory.close();
// Returns a TestShardManager builder based on datastoreContextBuilder with a mocked DistributedDataStore.
204 private TestShardManager.Builder newTestShardMgrBuilder() {
205 return TestShardManager.builder(datastoreContextBuilder).distributedDataStore(mock(DistributedDataStore.class));
// Same as the no-argument overload, but with the given configuration set on the builder.
208 private TestShardManager.Builder newTestShardMgrBuilder(final Configuration config) {
209 return TestShardManager.builder(datastoreContextBuilder).configuration(config)
210 .distributedDataStore(mock(DistributedDataStore.class));
// Shard manager Props using a default-constructed MockConfiguration.
213 private Props newShardMgrProps() {
214 return newShardMgrProps(new MockConfiguration());
// Shard manager Props for the given configuration, with the shared 'ready' future as readiness future.
217 private Props newShardMgrProps(final Configuration config) {
218 return newTestShardMgrBuilder(config).readinessFuture(ready).props();
// Creates an actor system named "cluster-test" from the given config key.
// NOTE(review): the two-argument newActorSystem is defined outside this view (presumably inherited) - confirm.
221 private ActorSystem newActorSystem(final String config) {
222 return newActorSystem("cluster-test", config);
// Creates a MessageCollectorActor named after the shard identifier built from shardName, memberName
// and the type "config".
225 private ActorRef newMockShardActor(final ActorSystem system, final String shardName, final String memberName) {
226 String name = ShardIdentifier.create(shardName, MemberName.forName(memberName), "config").toString();
// On the test's own actor system the actor is created through actorFactory (closed in tearDown());
// on any other system it is created directly on that system.
227 if (system == getSystem()) {
228 return actorFactory.createActor(MessageCollectorActor.props(), name);
231 return system.actorOf(MessageCollectorActor.props(), name);
// Builds a mocked DatastoreContextFactory that answers both the base-context lookup and any
// per-shard lookup with the supplied datastoreContext.
// NOTE(review): the line numbered 238 (presumably 'return mockFactory;') is not visible here - confirm.
234 private static DatastoreContextFactory newDatastoreContextFactory(final DatastoreContext datastoreContext) {
235 DatastoreContextFactory mockFactory = mock(DatastoreContextFactory.class);
236 doReturn(datastoreContext).when(mockFactory).getBaseDatastoreContext();
237 doReturn(datastoreContext).when(mockFactory).getShardDatastoreContext(anyString());
// Builder variant that uses the shared mockShardActor as the shard actor.
241 private TestShardManager.Builder newTestShardMgrBuilderWithMockShardActor() {
242 return newTestShardMgrBuilderWithMockShardActor(mockShardActor);
// Returns a TestShardManager builder with the given shard actor and a mocked DistributedDataStore.
245 private TestShardManager.Builder newTestShardMgrBuilderWithMockShardActor(final ActorRef shardActor) {
246 return TestShardManager.builder(datastoreContextBuilder).shardActor(shardActor)
247 .distributedDataStore(mock(DistributedDataStore.class));
// Props for a shard manager backed by the shared mock shard actor, on the default dispatcher.
251 private Props newPropsShardMgrWithMockShardActor() {
252 return newTestShardMgrBuilderWithMockShardActor().props().withDispatcher(
253 Dispatchers.DefaultDispatcherId());
// Props for a shard manager backed by the given shard actor, on the default dispatcher.
256 private Props newPropsShardMgrWithMockShardActor(final ActorRef shardActor) {
257 return newTestShardMgrBuilderWithMockShardActor(shardActor).props()
258 .withDispatcher(Dispatchers.DefaultDispatcherId());
// Creates a TestShardManager from the default Props returned by newShardMgrProps().
262 private TestShardManager newTestShardManager() {
263 return newTestShardManager(newShardMgrProps());
// Creates the shard manager as a TestActorRef, takes its underlying TestShardManager instance and
// calls waitForRecoveryComplete() on it.
// NOTE(review): the line numbered 270 (presumably 'return shardManager;') is not visible here - confirm.
266 private TestShardManager newTestShardManager(final Props props) {
267 TestActorRef<TestShardManager> shardManagerActor = actorFactory.createTestActor(props);
268 TestShardManager shardManager = shardManagerActor.underlyingActor();
269 shardManager.waitForRecoveryComplete();
// Repeatedly asks the shard manager for the named local shard (FindLocalShard with the second
// argument true) and expects a LocalShardFound reply, retrying every 50 ms while at most about
// 5 seconds have elapsed.
// NOTE(review): several lines are not visible here (numbered 274, 278, 281, 283-285, 287 onwards):
// the rest of the parameter list (which must declare 'kit'), the try opener, the success exit and
// whatever is done with 'last' after the loop. Confirm against the full file before relying on this.
273 private static void waitForShardInitialized(final ActorRef shardManager, final String shardName,
275 AssertionError last = null;
276 Stopwatch sw = Stopwatch.createStarted();
277 while (sw.elapsed(TimeUnit.SECONDS) <= 5) {
279 shardManager.tell(new FindLocalShard(shardName, true), kit.getRef());
280 kit.expectMsgClass(LocalShardFound.class);
282 } catch (AssertionError e) {
// Back off briefly before the next attempt.
286 Uninterruptibles.sleepUninterruptibly(50, TimeUnit.MILLISECONDS);
// Waits up to 5 seconds for a reply that is either of msgClass or a Failure. A Failure reply is
// turned into an AssertionError whose message is "<msg> failed" and whose cause is the failure's cause.
// NOTE(review): the success-path return (lines numbered 297 onwards) is not visible here; the
// unchecked suppression suggests a cast of 'reply' to T - confirm.
292 @SuppressWarnings("unchecked")
293 private static <T> T expectMsgClassOrFailure(final Class<T> msgClass, final TestKit kit, final String msg) {
294 Object reply = kit.expectMsgAnyClassOf(kit.duration("5 sec"), msgClass, Failure.class);
295 if (reply instanceof Failure) {
296 throw new AssertionError(msg + " failed", ((Failure)reply).cause());
// Checks that each shard is created with its own DatastoreContext (election timeout factor 6 for
// "default", 7 for "topology") and that a replacement DatastoreContextFactory sent to the shard
// manager reaches the shard actors (factors 66 and 77).
// NOTE(review): the embedded numbering has gaps (e.g. 307-308, 311-312, 342-345, 348-349, 352,
// 355-357); the missing lines presumably hold the doReturn( openers, the super call, the null
// check and the return statements - confirm against the full file.
303 public void testPerShardDatastoreContext() throws Exception {
304 LOG.info("testPerShardDatastoreContext starting");
// Base factory with factor 5; the two per-shard stubbings below use factors 6 and 7.
305 final DatastoreContextFactory mockFactory = newDatastoreContextFactory(
306 datastoreContextBuilder.shardElectionTimeoutFactor(5).build());
309 DatastoreContext.newBuilderFrom(datastoreContextBuilder.build()).shardElectionTimeoutFactor(6).build())
310 .when(mockFactory).getShardDatastoreContext("default");
313 DatastoreContext.newBuilderFrom(datastoreContextBuilder.build()).shardElectionTimeoutFactor(7).build())
314 .when(mockFactory).getShardDatastoreContext("topology");
// Configuration exposing two shards, both hosted on member-1.
316 final MockConfiguration mockConfig = new MockConfiguration() {
318 public Collection<String> getMemberShardNames(final MemberName memberName) {
319 return Arrays.asList("default", "topology");
323 public Collection<MemberName> getMembersFromShardName(final String shardName) {
324 return members("member-1");
328 final ActorRef defaultShardActor = actorFactory.createActor(
329 MessageCollectorActor.props(), actorFactory.generateActorId("default"));
330 final ActorRef topologyShardActor = actorFactory.createActor(
331 MessageCollectorActor.props(), actorFactory.generateActorId("topology"));
// Shard name -> (collector actor, context the shard was created with). The value half starts as
// null and is filled in by newShardActor() below; synchronized because it is written from the
// shard manager and read from the test.
333 final Map<String, Entry<ActorRef, DatastoreContext>> shardInfoMap = Collections.synchronizedMap(
334 new HashMap<>());
335 shardInfoMap.put("default", new AbstractMap.SimpleEntry<>(defaultShardActor, null));
336 shardInfoMap.put("topology", new AbstractMap.SimpleEntry<>(topologyShardActor, null));
338 final PrimaryShardInfoFutureCache primaryShardInfoCache = new PrimaryShardInfoFutureCache();
// Counted down once per newShardActor() call; two shards are expected.
339 final CountDownLatch newShardActorLatch = new CountDownLatch(2);
// ShardManager subclass that hands out the pre-created collector actors instead of real shards
// and records the DatastoreContext each shard was given.
340 class LocalShardManager extends ShardManager {
341 LocalShardManager(final AbstractShardManagerCreator<?> creator) {
346 protected ActorRef newShardActor(final ShardInformation info) {
347 Entry<ActorRef, DatastoreContext> entry = shardInfoMap.get(info.getShardName());
350 ref = entry.getKey();
351 entry.setValue(info.getDatastoreContext());
354 newShardActorLatch.countDown();
359 final Creator<ShardManager> creator = new Creator<>() {
360 private static final long serialVersionUID = 1L;
362 public ShardManager create() {
363 return new LocalShardManager(
364 new GenericCreator<>(LocalShardManager.class).datastoreContextFactory(mockFactory)
365 .primaryShardInfoCache(primaryShardInfoCache).configuration(mockConfig));
369 final TestKit kit = new TestKit(getSystem());
371 final ActorRef shardManager = actorFactory.createActor(Props.create(ShardManager.class,
372 new DelegatingShardManagerCreator(creator)).withDispatcher(Dispatchers.DefaultDispatcherId()));
// The assertion below waits for both newShardActor() calls after this message is sent.
374 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
376 assertTrue("Shard actors created", newShardActorLatch.await(5, TimeUnit.SECONDS));
377 assertEquals("getShardElectionTimeoutFactor", 6,
378 shardInfoMap.get("default").getValue().getShardElectionTimeoutFactor());
379 assertEquals("getShardElectionTimeoutFactor", 7,
380 shardInfoMap.get("topology").getValue().getShardElectionTimeoutFactor());
// Second factory with different per-shard factors, sent to the shard manager as a message.
382 DatastoreContextFactory newMockFactory = newDatastoreContextFactory(
383 datastoreContextBuilder.shardElectionTimeoutFactor(5).build());
385 DatastoreContext.newBuilderFrom(datastoreContextBuilder.build()).shardElectionTimeoutFactor(66).build())
386 .when(newMockFactory).getShardDatastoreContext("default");
389 DatastoreContext.newBuilderFrom(datastoreContextBuilder.build()).shardElectionTimeoutFactor(77).build())
390 .when(newMockFactory).getShardDatastoreContext("topology");
392 shardManager.tell(newMockFactory, kit.getRef());
// Each collector actor must have received a DatastoreContext carrying its new factor.
394 DatastoreContext newContext = MessageCollectorActor.expectFirstMatching(defaultShardActor,
395 DatastoreContext.class);
396 assertEquals("getShardElectionTimeoutFactor", 66, newContext.getShardElectionTimeoutFactor());
398 newContext = MessageCollectorActor.expectFirstMatching(topologyShardActor, DatastoreContext.class);
399 assertEquals("getShardElectionTimeoutFactor", 77, newContext.getShardElectionTimeoutFactor());
401 LOG.info("testPerShardDatastoreContext ending");
// Asking for the primary of a shard name that is not configured ("non-existent") must be answered
// with a PrimaryNotFoundException within 5 seconds.
405 public void testOnReceiveFindPrimaryForNonExistentShard() {
406 final TestKit kit = new TestKit(getSystem());
407 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
409 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
411 shardManager.tell(new FindPrimary("non-existent", false), kit.getRef());
413 kit.expectMsgClass(Duration.ofSeconds(5), PrimaryNotFoundException.class);
// When the local member-1 shard reports itself as leader, FindPrimary for the default shard must be
// answered with LocalPrimaryShardFound carrying the local path and the leader's data tree.
417 public void testOnReceiveFindPrimaryForLocalLeaderShard() {
418 LOG.info("testOnReceiveFindPrimaryForLocalLeaderShard starting");
419 final TestKit kit = new TestKit(getSystem());
420 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
422 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
424 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
425 shardManager.tell(new ActorInitialized(), mockShardActor);
// Leader id equals the local member id, i.e. the local shard is the leader.
427 DataTree mockDataTree = mock(DataTree.class);
428 shardManager.tell(new ShardLeaderStateChanged(memberId, memberId, mockDataTree,
429 DataStoreVersions.CURRENT_VERSION), kit.getRef());
431 MessageCollectorActor.expectFirstMatching(mockShardActor, RegisterRoleChangeListener.class);
// NOTE(review): lines numbered 432 and 434 are not visible; the notification below is presumably
// the first argument of a shardManager.tell(...) call - confirm.
433 new RoleChangeNotification(memberId, RaftState.Candidate.name(), RaftState.Leader.name()),
436 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, false), kit.getRef());
438 LocalPrimaryShardFound primaryFound = kit.expectMsgClass(Duration.ofSeconds(5),
439 LocalPrimaryShardFound.class);
440 assertTrue("Unexpected primary path " + primaryFound.getPrimaryPath(),
441 primaryFound.getPrimaryPath().contains("member-1-shard-default"));
442 assertSame("getLocalShardDataTree", mockDataTree, primaryFound.getLocalShardDataTree());
444 LOG.info("testOnReceiveFindPrimaryForLocalLeaderShard ending");
// The local shard is a follower and names member-2 as leader, but no member-up event for member-2
// is sent in this test; FindPrimary must then be answered with NoShardLeaderException.
448 public void testOnReceiveFindPrimaryForNonLocalLeaderShardBeforeMemberUp() {
449 LOG.info("testOnReceiveFindPrimaryForNonLocalLeaderShardBeforeMemberUp starting");
450 final TestKit kit = new TestKit(getSystem());
451 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
453 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
454 shardManager.tell(new ActorInitialized(), mockShardActor);
456 String memberId2 = "member-2-shard-default-" + shardMrgIDSuffix;
457 String memberId1 = "member-1-shard-default-" + shardMrgIDSuffix;
// NOTE(review): lines numbered 458, 460 and 462 are not visible; the two messages below are
// presumably wrapped in shardManager.tell(..., mockShardActor) calls - confirm.
459 new RoleChangeNotification(memberId1, RaftState.Candidate.name(), RaftState.Follower.name()),
461 shardManager.tell(new LeaderStateChanged(memberId1, memberId2, DataStoreVersions.CURRENT_VERSION),
464 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, false), kit.getRef());
466 kit.expectMsgClass(Duration.ofSeconds(5), NoShardLeaderException.class);
468 LOG.info("testOnReceiveFindPrimaryForNonLocalLeaderShardBeforeMemberUp ending");
// After a member-up event for member-2 and a leader change naming member-2, FindPrimary must be
// answered with RemotePrimaryShardFound pointing at member-2 and reporting the leader's version.
472 public void testOnReceiveFindPrimaryForNonLocalLeaderShard() {
473 LOG.info("testOnReceiveFindPrimaryForNonLocalLeaderShard starting");
474 final TestKit kit = new TestKit(getSystem());
475 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
477 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
478 shardManager.tell(new ActorInitialized(), mockShardActor);
// Announce member-2, passing the test kit's own actor path as its address.
480 String memberId2 = "member-2-shard-default-" + shardMrgIDSuffix;
481 MockClusterWrapper.sendMemberUp(shardManager, "member-2", kit.getRef().path().toString());
483 String memberId1 = "member-1-shard-default-" + shardMrgIDSuffix;
// NOTE(review): lines numbered 484 and 486 are not visible; the notification below is presumably
// the first argument of a shardManager.tell(...) call - confirm.
485 new RoleChangeNotification(memberId1, RaftState.Candidate.name(), RaftState.Follower.name()),
// Use a version one below the current one so the assertion proves the leader's version is echoed back.
487 short leaderVersion = DataStoreVersions.CURRENT_VERSION - 1;
488 shardManager.tell(new ShardLeaderStateChanged(memberId1, memberId2, leaderVersion), mockShardActor);
490 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, false), kit.getRef());
492 RemotePrimaryShardFound primaryFound = kit.expectMsgClass(Duration.ofSeconds(5), RemotePrimaryShardFound.class);
493 assertTrue("Unexpected primary path " + primaryFound.getPrimaryPath(),
494 primaryFound.getPrimaryPath().contains("member-2-shard-default"));
495 assertEquals("getPrimaryVersion", leaderVersion, primaryFound.getPrimaryVersion());
497 LOG.info("testOnReceiveFindPrimaryForNonLocalLeaderShard ending");
// FindPrimary is sent without any preceding UpdateSchemaContext or ActorInitialized message; the
// expected reply is a NotInitializedException.
501 public void testOnReceiveFindPrimaryForUninitializedShard() {
502 final TestKit kit = new TestKit(getSystem());
503 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
505 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, false), kit.getRef());
507 kit.expectMsgClass(Duration.ofSeconds(5), NotInitializedException.class);
// The shard has reported ActorInitialized but no role change has been sent; FindPrimary must be
// answered with NoShardLeaderException.
511 public void testOnReceiveFindPrimaryForInitializedShardWithNoRole() {
512 final TestKit kit = new TestKit(getSystem());
513 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
515 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
516 shardManager.tell(new ActorInitialized(), mockShardActor);
518 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, false), kit.getRef());
520 kit.expectMsgClass(Duration.ofSeconds(5), NoShardLeaderException.class);
// A follower shard with no known leader first yields NoShardLeaderException; once a
// ShardLeaderStateChanged names the local shard as leader, the same query yields
// LocalPrimaryShardFound with the leader's data tree.
524 public void testOnReceiveFindPrimaryForFollowerShardWithNoInitialLeaderId() {
525 LOG.info("testOnReceiveFindPrimaryForFollowerShardWithNoInitialLeaderId starting");
526 final TestKit kit = new TestKit(getSystem());
527 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
529 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
530 shardManager.tell(new ActorInitialized(), mockShardActor);
532 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
// NOTE(review): lines numbered 533 and 535 are not visible; the notification below is presumably
// the first argument of a shardManager.tell(...) call - confirm.
534 new RoleChangeNotification(memberId, RaftState.Candidate.name(), RaftState.Follower.name()),
// Follower role but no leader id yet: no primary can be reported.
537 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, false), kit.getRef());
539 kit.expectMsgClass(Duration.ofSeconds(5), NoShardLeaderException.class);
// Now announce the local shard as leader and ask again.
541 DataTree mockDataTree = mock(DataTree.class);
542 shardManager.tell(new ShardLeaderStateChanged(memberId, memberId, mockDataTree,
543 DataStoreVersions.CURRENT_VERSION), mockShardActor);
545 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, false), kit.getRef());
547 LocalPrimaryShardFound primaryFound = kit.expectMsgClass(Duration.ofSeconds(5),
548 LocalPrimaryShardFound.class);
549 assertTrue("Unexpected primary path " + primaryFound.getPrimaryPath(),
550 primaryFound.getPrimaryPath().contains("member-1-shard-default"));
551 assertSame("getLocalShardDataTree", mockDataTree, primaryFound.getLocalShardDataTree());
// End-of-test marker; it previously repeated "starting", which made the log misleading.
553 LOG.info("testOnReceiveFindPrimaryForFollowerShardWithNoInitialLeaderId ending");
// With the second FindPrimary argument set to true the reply is withheld until the shard has been
// initialized, has become leader and has announced its leader state; exactly one
// LocalPrimaryShardFound is then expected.
557 public void testOnReceiveFindPrimaryWaitForShardLeader() {
558 LOG.info("testOnReceiveFindPrimaryWaitForShardLeader starting");
// Raise the initialization timeout from the builder's 600 ms to 10 s for this test.
559 datastoreContextBuilder.shardInitializationTimeout(10, TimeUnit.SECONDS);
560 final TestKit kit = new TestKit(getSystem());
561 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
563 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
565 // We're passing waitUntilInitialized = true to FindPrimary so
566 // the response should be
567 // delayed until we send ActorInitialized and
568 // RoleChangeNotification.
569 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, true), kit.getRef());
// No reply may arrive after any of the intermediate steps below.
571 kit.expectNoMessage(Duration.ofMillis(150));
573 shardManager.tell(new ActorInitialized(), mockShardActor);
575 kit.expectNoMessage(Duration.ofMillis(150));
577 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
// NOTE(review): lines numbered 578 and 580 are not visible; the notification below is presumably
// the first argument of a shardManager.tell(...) call - confirm.
579 new RoleChangeNotification(memberId, RaftState.Candidate.name(), RaftState.Leader.name()),
582 kit.expectNoMessage(Duration.ofMillis(150));
// The leader-state announcement is what finally releases the pending reply.
584 DataTree mockDataTree = mock(DataTree.class);
585 shardManager.tell(new ShardLeaderStateChanged(memberId, memberId, mockDataTree,
586 DataStoreVersions.CURRENT_VERSION), mockShardActor);
588 LocalPrimaryShardFound primaryFound = kit.expectMsgClass(Duration.ofSeconds(5), LocalPrimaryShardFound.class);
589 assertTrue("Unexpected primary path " + primaryFound.getPrimaryPath(),
590 primaryFound.getPrimaryPath().contains("member-1-shard-default"));
591 assertSame("getLocalShardDataTree", mockDataTree, primaryFound.getLocalShardDataTree());
// Make sure no second reply follows.
593 kit.expectNoMessage(Duration.ofMillis(200));
595 LOG.info("testOnReceiveFindPrimaryWaitForShardLeader ending");
// A waiting FindPrimary (second argument true) against a shard that has not sent ActorInitialized
// must be answered with NotInitializedException within 2 seconds - presumably once the 600 ms
// initialization timeout configured on datastoreContextBuilder elapses (confirm).
599 public void testOnReceiveFindPrimaryWaitForReadyWithUninitializedShard() {
600 LOG.info("testOnReceiveFindPrimaryWaitForReadyWithUninitializedShard starting");
601 final TestKit kit = new TestKit(getSystem());
602 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
604 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
606 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, true), kit.getRef());
608 kit.expectMsgClass(Duration.ofSeconds(2), NotInitializedException.class);
// A late ActorInitialized must not trigger a second reply to the already-answered request.
610 shardManager.tell(new ActorInitialized(), mockShardActor);
612 kit.expectNoMessage(Duration.ofMillis(200));
614 LOG.info("testOnReceiveFindPrimaryWaitForReadyWithUninitializedShard ending");
// A waiting FindPrimary against an initialized shard whose role is Candidate must be answered
// with NoShardLeaderException within 2 seconds.
618 public void testOnReceiveFindPrimaryWaitForReadyWithCandidateShard() {
619 LOG.info("testOnReceiveFindPrimaryWaitForReadyWithCandidateShard starting");
620 final TestKit kit = new TestKit(getSystem());
621 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
623 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
624 shardManager.tell(new ActorInitialized(), mockShardActor);
// Role change with a null previous role and Candidate as the new role.
625 shardManager.tell(new RoleChangeNotification("member-1-shard-default-" + shardMrgIDSuffix, null,
626 RaftState.Candidate.name()), mockShardActor);
628 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, true), kit.getRef());
630 kit.expectMsgClass(Duration.ofSeconds(2), NoShardLeaderException.class);
632 LOG.info("testOnReceiveFindPrimaryWaitForReadyWithCandidateShard ending");
// A waiting FindPrimary against an initialized shard whose role is IsolatedLeader must be answered
// with NoShardLeaderException within 2 seconds.
636 public void testOnReceiveFindPrimaryWaitForReadyWithIsolatedLeaderShard() {
637 LOG.info("testOnReceiveFindPrimaryWaitForReadyWithIsolatedLeaderShard starting");
638 final TestKit kit = new TestKit(getSystem());
639 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
641 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
642 shardManager.tell(new ActorInitialized(), mockShardActor);
// Role change with a null previous role and IsolatedLeader as the new role.
643 shardManager.tell(new RoleChangeNotification("member-1-shard-default-" + shardMrgIDSuffix, null,
644 RaftState.IsolatedLeader.name()), mockShardActor);
646 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, true), kit.getRef());
648 kit.expectMsgClass(Duration.ofSeconds(2), NoShardLeaderException.class);
650 LOG.info("testOnReceiveFindPrimaryWaitForReadyWithIsolatedLeaderShard ending");
// A waiting FindPrimary against an initialized shard for which no role change was ever sent must
// be answered with NoShardLeaderException within 2 seconds.
654 public void testOnReceiveFindPrimaryWaitForReadyWithNoRoleShard() {
655 LOG.info("testOnReceiveFindPrimaryWaitForReadyWithNoRoleShard starting");
656 final TestKit kit = new TestKit(getSystem());
657 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
659 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
660 shardManager.tell(new ActorInitialized(), mockShardActor);
662 shardManager.tell(new FindPrimary(Shard.DEFAULT_NAME, true), kit.getRef());
664 kit.expectMsgClass(Duration.ofSeconds(2), NoShardLeaderException.class);
666 LOG.info("testOnReceiveFindPrimaryWaitForReadyWithNoRoleShard ending");
// Two-node scenario: member-1's shard manager is asked for the primary of the "astronauts" shard,
// which in this test is configured only on member-2; the expected reply is RemotePrimaryShardFound
// with member-2's path and the leader version announced on member-2.
670 public void testOnReceiveFindPrimaryForRemoteShard() {
671 LOG.info("testOnReceiveFindPrimaryForRemoteShard starting");
// NOTE(review): this is the same expression as the shardMgrID field initializer; the local looks redundant.
672 String shardManagerID = ShardManagerIdentifier.builder().type(shardMrgIDSuffix).build().toString();
674 // Create an ActorSystem ShardManager actor for member-1.
676 final ActorSystem system1 = newActorSystem("Member1");
677 Cluster.get(system1).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
679 final TestActorRef<TestShardManager> shardManager1 = TestActorRef.create(system1,
680 newTestShardMgrBuilderWithMockShardActor().cluster(
681 new ClusterWrapperImpl(system1)).props().withDispatcher(
682 Dispatchers.DefaultDispatcherId()), shardManagerID);
684 // Create an ActorSystem ShardManager actor for member-2.
686 final ActorSystem system2 = newActorSystem("Member2");
688 Cluster.get(system2).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
690 final ActorRef mockShardActor2 = newMockShardActor(system2, "astronauts", "member-2");
// member-2's view: "default" is shared by both members, "astronauts" lives on member-2 only.
692 MockConfiguration mockConfig2 = new MockConfiguration(
693 ImmutableMap.<String, List<String>>builder().put("default", Arrays.asList("member-1", "member-2"))
694 .put("astronauts", Arrays.asList("member-2")).build());
696 final TestActorRef<TestShardManager> shardManager2 = TestActorRef.create(system2,
697 newTestShardMgrBuilder(mockConfig2).shardActor(mockShardActor2).cluster(
698 new ClusterWrapperImpl(system2)).props().withDispatcher(
699 Dispatchers.DefaultDispatcherId()), shardManagerID);
701 final TestKit kit = new TestKit(system1);
702 shardManager1.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
703 shardManager2.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
705 shardManager2.tell(new ActorInitialized(), mockShardActor2);
// Announce member-2's astronauts shard as its own leader, with a version one below the current one.
// NOTE(review): lines numbered 710 and 712 are not visible; they presumably carry the sender
// argument that closes each of the two tell(...) calls below - confirm.
707 String memberId2 = "member-2-shard-astronauts-" + shardMrgIDSuffix;
708 short leaderVersion = DataStoreVersions.CURRENT_VERSION - 1;
709 shardManager2.tell(new ShardLeaderStateChanged(memberId2, memberId2, mock(DataTree.class), leaderVersion),
711 shardManager2.tell(new RoleChangeNotification(memberId2, RaftState.Candidate.name(), RaftState.Leader.name()),
// Query member-1 only after its shard manager's waitForMemberUp() has returned.
714 shardManager1.underlyingActor().waitForMemberUp();
715 shardManager1.tell(new FindPrimary("astronauts", false), kit.getRef());
717 RemotePrimaryShardFound found = kit.expectMsgClass(Duration.ofSeconds(5), RemotePrimaryShardFound.class);
718 String path = found.getPrimaryPath();
719 assertTrue("Unexpected primary path " + path, path.contains("member-2-shard-astronauts-config"));
720 assertEquals("getPrimaryVersion", leaderVersion, found.getPrimaryVersion());
722 shardManager2.underlyingActor().verifyFindPrimary();
// NOTE(review): the disabled snippet below calls getRef()/expectMsgClass without the 'kit.' receiver
// used everywhere else in this method, so it would need updating before being re-enabled.
724 // This part times out quite a bit on jenkins for some reason
726 // Cluster.get(system2).down(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
728 // shardManager1.underlyingActor().waitForMemberRemoved();
730 // shardManager1.tell(new FindPrimary("astronauts", false), getRef());
732 // expectMsgClass(Duration.ofSeconds(5), PrimaryNotFoundException.class);
734 LOG.info("testOnReceiveFindPrimaryForRemoteShard ending");
738 public void testShardAvailabilityOnChangeOfMemberReachability() {
739 LOG.info("testShardAvailabilityOnChangeOfMemberReachability starting");
740 String shardManagerID = ShardManagerIdentifier.builder().type(shardMrgIDSuffix).build().toString();
742 // Create an ActorSystem ShardManager actor for member-1.
744 final ActorSystem system1 = newActorSystem("Member1");
745 Cluster.get(system1).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
747 final ActorRef mockShardActor1 = newMockShardActor(system1, Shard.DEFAULT_NAME, "member-1");
749 final TestActorRef<TestShardManager> shardManager1 = TestActorRef.create(system1,
750 newTestShardMgrBuilder().shardActor(mockShardActor1).cluster(
751 new ClusterWrapperImpl(system1)).props().withDispatcher(
752 Dispatchers.DefaultDispatcherId()), shardManagerID);
754 // Create an ActorSystem ShardManager actor for member-2.
756 final ActorSystem system2 = newActorSystem("Member2");
758 Cluster.get(system2).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
760 final ActorRef mockShardActor2 = newMockShardActor(system2, Shard.DEFAULT_NAME, "member-2");
762 MockConfiguration mockConfig2 = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
763 .put("default", Arrays.asList("member-1", "member-2")).build());
765 final TestActorRef<TestShardManager> shardManager2 = TestActorRef.create(system2,
766 newTestShardMgrBuilder(mockConfig2).shardActor(mockShardActor2).cluster(
767 new ClusterWrapperImpl(system2)).props().withDispatcher(
768 Dispatchers.DefaultDispatcherId()), shardManagerID);
770 final TestKit kit = new TestKit(system1);
771 shardManager1.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
772 shardManager2.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
773 shardManager1.tell(new ActorInitialized(), mockShardActor1);
774 shardManager2.tell(new ActorInitialized(), mockShardActor2);
776 String memberId2 = "member-2-shard-default-" + shardMrgIDSuffix;
777 String memberId1 = "member-1-shard-default-" + shardMrgIDSuffix;
778 shardManager1.tell(new ShardLeaderStateChanged(memberId1, memberId2, mock(DataTree.class),
779 DataStoreVersions.CURRENT_VERSION), mockShardActor1);
781 new RoleChangeNotification(memberId1, RaftState.Candidate.name(), RaftState.Follower.name()),
783 shardManager2.tell(new ShardLeaderStateChanged(memberId2, memberId2, mock(DataTree.class),
784 DataStoreVersions.CURRENT_VERSION), mockShardActor2);
786 new RoleChangeNotification(memberId2, RaftState.Candidate.name(), RaftState.Leader.name()),
788 shardManager1.underlyingActor().waitForMemberUp();
790 shardManager1.tell(new FindPrimary("default", true), kit.getRef());
792 RemotePrimaryShardFound found = kit.expectMsgClass(Duration.ofSeconds(5), RemotePrimaryShardFound.class);
793 String path = found.getPrimaryPath();
794 assertTrue("Unexpected primary path " + path, path.contains("member-2-shard-default-config"));
796 shardManager1.tell(MockClusterWrapper.createUnreachableMember("member-2", "akka://cluster-test@127.0.0.1:2558"),
799 shardManager1.underlyingActor().waitForUnreachableMember();
800 MessageCollectorActor.clearMessages(mockShardActor1);
802 shardManager1.tell(MockClusterWrapper.createMemberRemoved("member-2", "akka://cluster-test@127.0.0.1:2558"),
805 shardManager1.tell(new FindPrimary("default", true), kit.getRef());
807 kit.expectMsgClass(Duration.ofSeconds(5), NoShardLeaderException.class);
809 shardManager1.tell(MockClusterWrapper.createReachableMember("member-2", "akka://cluster-test@127.0.0.1:2558"),
812 shardManager1.underlyingActor().waitForReachableMember();
814 shardManager1.tell(new FindPrimary("default", true), kit.getRef());
816 RemotePrimaryShardFound found1 = kit.expectMsgClass(Duration.ofSeconds(5), RemotePrimaryShardFound.class);
817 String path1 = found1.getPrimaryPath();
818 assertTrue("Unexpected primary path " + path1, path1.contains("member-2-shard-default-config"));
820 shardManager1.tell(MockClusterWrapper.createMemberUp("member-2", "akka://cluster-test@127.0.0.1:2558"),
823 // Test FindPrimary wait succeeds after reachable member event.
825 shardManager1.tell(MockClusterWrapper.createUnreachableMember("member-2",
826 "akka://cluster-test@127.0.0.1:2558"), kit.getRef());
827 shardManager1.underlyingActor().waitForUnreachableMember();
829 shardManager1.tell(new FindPrimary("default", true), kit.getRef());
832 MockClusterWrapper.createReachableMember("member-2", "akka://cluster-test@127.0.0.1:2558"), kit.getRef());
834 RemotePrimaryShardFound found2 = kit.expectMsgClass(Duration.ofSeconds(5), RemotePrimaryShardFound.class);
835 String path2 = found2.getPrimaryPath();
836 assertTrue("Unexpected primary path " + path2, path2.contains("member-2-shard-default-config"));
838 LOG.info("testShardAvailabilityOnChangeOfMemberReachability ending");
842 public void testShardAvailabilityChangeOnMemberUnreachableAndLeadershipChange() {
843 LOG.info("testShardAvailabilityChangeOnMemberUnreachableAndLeadershipChange starting");
844 String shardManagerID = ShardManagerIdentifier.builder().type(shardMrgIDSuffix).build().toString();
846 // Create an ActorSystem ShardManager actor for member-1.
848 final ActorSystem system1 = newActorSystem("Member1");
849 Cluster.get(system1).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
851 final ActorRef mockShardActor1 = newMockShardActor(system1, Shard.DEFAULT_NAME, "member-1");
853 final PrimaryShardInfoFutureCache primaryShardInfoCache = new PrimaryShardInfoFutureCache();
854 final TestActorRef<TestShardManager> shardManager1 = TestActorRef.create(system1,
855 newTestShardMgrBuilder().shardActor(mockShardActor1).cluster(new ClusterWrapperImpl(system1))
856 .primaryShardInfoCache(primaryShardInfoCache).props()
857 .withDispatcher(Dispatchers.DefaultDispatcherId()),
860 // Create an ActorSystem ShardManager actor for member-2.
862 final ActorSystem system2 = newActorSystem("Member2");
864 Cluster.get(system2).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
866 final ActorRef mockShardActor2 = newMockShardActor(system2, Shard.DEFAULT_NAME, "member-2");
868 MockConfiguration mockConfig2 = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
869 .put("default", Arrays.asList("member-1", "member-2")).build());
871 final TestActorRef<TestShardManager> shardManager2 = TestActorRef.create(system2,
872 newTestShardMgrBuilder(mockConfig2).shardActor(mockShardActor2).cluster(
873 new ClusterWrapperImpl(system2)).props().withDispatcher(
874 Dispatchers.DefaultDispatcherId()), shardManagerID);
876 final TestKit kit = new TestKit(system1);
877 shardManager1.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
878 shardManager2.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
879 shardManager1.tell(new ActorInitialized(), mockShardActor1);
880 shardManager2.tell(new ActorInitialized(), mockShardActor2);
882 String memberId2 = "member-2-shard-default-" + shardMrgIDSuffix;
883 String memberId1 = "member-1-shard-default-" + shardMrgIDSuffix;
884 shardManager1.tell(new ShardLeaderStateChanged(memberId1, memberId2, mock(DataTree.class),
885 DataStoreVersions.CURRENT_VERSION), mockShardActor1);
887 new RoleChangeNotification(memberId1, RaftState.Candidate.name(), RaftState.Follower.name()),
889 shardManager2.tell(new ShardLeaderStateChanged(memberId2, memberId2, mock(DataTree.class),
890 DataStoreVersions.CURRENT_VERSION), mockShardActor2);
892 new RoleChangeNotification(memberId2, RaftState.Candidate.name(), RaftState.Leader.name()),
894 shardManager1.underlyingActor().waitForMemberUp();
896 shardManager1.tell(new FindPrimary("default", true), kit.getRef());
898 RemotePrimaryShardFound found = kit.expectMsgClass(Duration.ofSeconds(5), RemotePrimaryShardFound.class);
899 String path = found.getPrimaryPath();
900 assertTrue("Unexpected primary path " + path, path.contains("member-2-shard-default-config"));
902 primaryShardInfoCache.putSuccessful("default", new PrimaryShardInfo(
903 system1.actorSelection(mockShardActor1.path()), DataStoreVersions.CURRENT_VERSION));
905 shardManager1.tell(MockClusterWrapper.createUnreachableMember("member-2",
906 "akka://cluster-test@127.0.0.1:2558"), kit.getRef());
908 shardManager1.underlyingActor().waitForUnreachableMember();
910 shardManager1.tell(new FindPrimary("default", true), kit.getRef());
912 kit.expectMsgClass(Duration.ofSeconds(5), NoShardLeaderException.class);
914 assertNull("Expected primaryShardInfoCache entry removed",
915 primaryShardInfoCache.getIfPresent("default"));
917 shardManager1.tell(new ShardLeaderStateChanged(memberId1, memberId1, mock(DataTree.class),
918 DataStoreVersions.CURRENT_VERSION), mockShardActor1);
920 new RoleChangeNotification(memberId1, RaftState.Follower.name(), RaftState.Leader.name()),
923 shardManager1.tell(new FindPrimary("default", true), kit.getRef());
925 LocalPrimaryShardFound found1 = kit.expectMsgClass(Duration.ofSeconds(5), LocalPrimaryShardFound.class);
926 String path1 = found1.getPrimaryPath();
927 assertTrue("Unexpected primary path " + path1, path1.contains("member-1-shard-default-config"));
929 LOG.info("testShardAvailabilityChangeOnMemberUnreachableAndLeadershipChange ending");
933 public void testShardAvailabilityChangeOnMemberWithNameContainedInLeaderIdUnreachable() {
934 LOG.info("testShardAvailabilityChangeOnMemberWithNameContainedInLeaderIdUnreachable starting");
935 String shardManagerID = ShardManagerIdentifier.builder().type(shardMrgIDSuffix).build().toString();
937 MockConfiguration mockConfig = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
938 .put("default", Arrays.asList("member-256", "member-2")).build());
940 // Create an ActorSystem, ShardManager and actor for member-256.
942 final ActorSystem system256 = newActorSystem("Member256");
943 // 2562 is the tcp port of Member256 in src/test/resources/application.conf.
944 Cluster.get(system256).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2562"));
946 final ActorRef mockShardActor256 = newMockShardActor(system256, Shard.DEFAULT_NAME, "member-256");
948 final PrimaryShardInfoFutureCache primaryShardInfoCache = new PrimaryShardInfoFutureCache();
950 // ShardManager must be created with shard configuration to let its localShards has shards.
951 final TestActorRef<TestShardManager> shardManager256 = TestActorRef.create(system256,
952 newTestShardMgrBuilder(mockConfig).shardActor(mockShardActor256)
953 .cluster(new ClusterWrapperImpl(system256))
954 .primaryShardInfoCache(primaryShardInfoCache).props()
955 .withDispatcher(Dispatchers.DefaultDispatcherId()),
958 // Create an ActorSystem, ShardManager and actor for member-2 whose name is contained in member-256.
960 final ActorSystem system2 = newActorSystem("Member2");
962 // Join member-2 into the cluster of member-256.
963 Cluster.get(system2).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2562"));
965 final ActorRef mockShardActor2 = newMockShardActor(system2, Shard.DEFAULT_NAME, "member-2");
967 final TestActorRef<TestShardManager> shardManager2 = TestActorRef.create(system2,
968 newTestShardMgrBuilder(mockConfig).shardActor(mockShardActor2).cluster(
969 new ClusterWrapperImpl(system2)).props().withDispatcher(
970 Dispatchers.DefaultDispatcherId()), shardManagerID);
972 final TestKit kit256 = new TestKit(system256);
973 shardManager256.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit256.getRef());
974 shardManager2.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit256.getRef());
975 shardManager256.tell(new ActorInitialized(), mockShardActor256);
976 shardManager2.tell(new ActorInitialized(), mockShardActor2);
978 String memberId256 = "member-256-shard-default-" + shardMrgIDSuffix;
979 String memberId2 = "member-2-shard-default-" + shardMrgIDSuffix;
980 shardManager256.tell(new ShardLeaderStateChanged(memberId256, memberId256, mock(DataTree.class),
981 DataStoreVersions.CURRENT_VERSION), mockShardActor256);
982 shardManager256.tell(
983 new RoleChangeNotification(memberId256, RaftState.Candidate.name(), RaftState.Leader.name()),
985 shardManager2.tell(new ShardLeaderStateChanged(memberId2, memberId256, mock(DataTree.class),
986 DataStoreVersions.CURRENT_VERSION), mockShardActor2);
988 new RoleChangeNotification(memberId2, RaftState.Candidate.name(), RaftState.Follower.name()),
990 shardManager256.underlyingActor().waitForMemberUp();
992 shardManager256.tell(new FindPrimary("default", true), kit256.getRef());
994 LocalPrimaryShardFound found = kit256.expectMsgClass(Duration.ofSeconds(5), LocalPrimaryShardFound.class);
995 String path = found.getPrimaryPath();
996 assertTrue("Unexpected primary path " + path + " which must on member-256",
997 path.contains("member-256-shard-default-config"));
999 PrimaryShardInfo primaryShardInfo = new PrimaryShardInfo(
1000 system256.actorSelection(mockShardActor256.path()), DataStoreVersions.CURRENT_VERSION);
1001 primaryShardInfoCache.putSuccessful("default", primaryShardInfo);
1003 // Simulate member-2 become unreachable.
1004 shardManager256.tell(MockClusterWrapper.createUnreachableMember("member-2",
1005 "akka://cluster-test@127.0.0.1:2558"), kit256.getRef());
1006 shardManager256.underlyingActor().waitForUnreachableMember();
1008 // Make sure leader shard on member-256 is still leader and still in the cache.
1009 shardManager256.tell(new FindPrimary("default", true), kit256.getRef());
1010 found = kit256.expectMsgClass(Duration.ofSeconds(5), LocalPrimaryShardFound.class);
1011 path = found.getPrimaryPath();
1012 assertTrue("Unexpected primary path " + path + " which must still not on member-256",
1013 path.contains("member-256-shard-default-config"));
1014 Future<PrimaryShardInfo> futurePrimaryShard = primaryShardInfoCache.getIfPresent("default");
1015 futurePrimaryShard.onComplete(new OnComplete<PrimaryShardInfo>() {
1017 public void onComplete(final Throwable failure, final PrimaryShardInfo futurePrimaryShardInfo) {
1018 if (failure != null) {
1019 assertTrue("Primary shard info is unexpectedly removed from primaryShardInfoCache", false);
1021 assertEquals("Expected primaryShardInfoCache entry",
1022 primaryShardInfo, futurePrimaryShardInfo);
1025 }, system256.dispatchers().defaultGlobalDispatcher());
1027 LOG.info("testShardAvailabilityChangeOnMemberWithNameContainedInLeaderIdUnreachable ending");
1031 public void testOnReceiveFindLocalShardForNonExistentShard() {
1032 final TestKit kit = new TestKit(getSystem());
1033 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
1035 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1037 shardManager.tell(new FindLocalShard("non-existent", false), kit.getRef());
1039 LocalShardNotFound notFound = kit.expectMsgClass(Duration.ofSeconds(5), LocalShardNotFound.class);
1041 assertEquals("getShardName", "non-existent", notFound.getShardName());
1045 public void testOnReceiveFindLocalShardForExistentShard() {
1046 final TestKit kit = new TestKit(getSystem());
1047 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
1049 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1050 shardManager.tell(new ActorInitialized(), mockShardActor);
1052 shardManager.tell(new FindLocalShard(Shard.DEFAULT_NAME, false), kit.getRef());
1054 LocalShardFound found = kit.expectMsgClass(Duration.ofSeconds(5), LocalShardFound.class);
1056 assertTrue("Found path contains " + found.getPath().path().toString(),
1057 found.getPath().path().toString().contains("member-1-shard-default-config"));
1061 public void testOnReceiveFindLocalShardForNotInitializedShard() {
1062 final TestKit kit = new TestKit(getSystem());
1063 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
1065 shardManager.tell(new FindLocalShard(Shard.DEFAULT_NAME, false), kit.getRef());
1067 kit.expectMsgClass(Duration.ofSeconds(5), NotInitializedException.class);
1071 public void testOnReceiveFindLocalShardWaitForShardInitialized() throws Exception {
1072 LOG.info("testOnReceiveFindLocalShardWaitForShardInitialized starting");
1073 final TestKit kit = new TestKit(getSystem());
1074 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
1076 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1078 // We're passing waitUntilInitialized = true to FindLocalShard
1079 // so the response should be
1080 // delayed until we send ActorInitialized.
1081 Future<Object> future = Patterns.ask(shardManager, new FindLocalShard(Shard.DEFAULT_NAME, true),
1082 new Timeout(5, TimeUnit.SECONDS));
1084 shardManager.tell(new ActorInitialized(), mockShardActor);
1086 Object resp = Await.result(future, kit.duration("5 seconds"));
1087 assertTrue("Expected: LocalShardFound, Actual: " + resp, resp instanceof LocalShardFound);
1089 LOG.info("testOnReceiveFindLocalShardWaitForShardInitialized starting");
1093 public void testRoleChangeNotificationAndShardLeaderStateChangedReleaseReady() throws Exception {
1094 TestShardManager shardManager = newTestShardManager();
1096 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
1097 shardManager.handleCommand(new RoleChangeNotification(
1098 memberId, RaftState.Candidate.name(), RaftState.Leader.name()));
1099 assertFalse(ready.isDone());
1101 shardManager.handleCommand(new ShardLeaderStateChanged(memberId, memberId,
1102 mock(DataTree.class), DataStoreVersions.CURRENT_VERSION));
1103 assertTrue(ready.isDone());
1107 public void testRoleChangeNotificationToFollowerWithShardLeaderStateChangedReleaseReady() throws Exception {
1108 final TestKit kit = new TestKit(getSystem());
1109 TestShardManager shardManager = newTestShardManager();
1111 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
1112 shardManager.handleCommand(new RoleChangeNotification(memberId, null, RaftState.Follower.name()));
1113 assertFalse(ready.isDone());
1115 shardManager.handleCommand(MockClusterWrapper.createMemberUp("member-2", kit.getRef().path().toString()));
1117 shardManager.handleCommand(
1118 new ShardLeaderStateChanged(memberId, "member-2-shard-default-" + shardMrgIDSuffix,
1119 mock(DataTree.class), DataStoreVersions.CURRENT_VERSION));
1120 assertTrue(ready.isDone());
1124 public void testReadyCountDownForMemberUpAfterLeaderStateChanged() throws Exception {
1125 final TestKit kit = new TestKit(getSystem());
1126 TestShardManager shardManager = newTestShardManager();
1128 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
1129 shardManager.handleCommand(new RoleChangeNotification(memberId, null, RaftState.Follower.name()));
1130 assertFalse(ready.isDone());
1132 shardManager.handleCommand(
1133 new ShardLeaderStateChanged(memberId, "member-2-shard-default-" + shardMrgIDSuffix,
1134 mock(DataTree.class), DataStoreVersions.CURRENT_VERSION));
1136 shardManager.handleCommand(MockClusterWrapper.createMemberUp("member-2", kit.getRef().path().toString()));
1137 assertTrue(ready.isDone());
1141 public void testRoleChangeNotificationDoNothingForUnknownShard() throws Exception {
1142 TestShardManager shardManager = newTestShardManager();
1144 shardManager.handleCommand(new RoleChangeNotification("unknown", RaftState.Candidate.name(),
1145 RaftState.Leader.name()));
1146 assertFalse(ready.isDone());
1150 public void testByDefaultSyncStatusIsFalse() {
1151 TestShardManager shardManager = newTestShardManager();
1153 assertFalse(shardManager.getMBean().getSyncStatus());
1157 public void testWhenShardIsLeaderSyncStatusIsTrue() throws Exception {
1158 TestShardManager shardManager = newTestShardManager();
1160 shardManager.handleCommand(new RoleChangeNotification("member-1-shard-default-" + shardMrgIDSuffix,
1161 RaftState.Follower.name(), RaftState.Leader.name()));
1163 assertTrue(shardManager.getMBean().getSyncStatus());
1167 public void testWhenShardIsCandidateSyncStatusIsFalse() throws Exception {
1168 TestShardManager shardManager = newTestShardManager();
1170 String shardId = "member-1-shard-default-" + shardMrgIDSuffix;
1171 shardManager.handleCommand(new RoleChangeNotification(shardId,
1172 RaftState.Follower.name(), RaftState.Candidate.name()));
1174 assertFalse(shardManager.getMBean().getSyncStatus());
1176 // Send a FollowerInitialSyncStatus with status = true for the replica whose current state is candidate
1177 shardManager.handleCommand(new FollowerInitialSyncUpStatus(
1180 assertFalse(shardManager.getMBean().getSyncStatus());
1184 public void testWhenShardIsFollowerSyncStatusDependsOnFollowerInitialSyncStatus() throws Exception {
1185 TestShardManager shardManager = newTestShardManager();
1187 String shardId = "member-1-shard-default-" + shardMrgIDSuffix;
1188 shardManager.handleCommand(new RoleChangeNotification(shardId,
1189 RaftState.Candidate.name(), RaftState.Follower.name()));
1191 // Initially will be false
1192 assertFalse(shardManager.getMBean().getSyncStatus());
1194 // Send status true will make sync status true
1195 shardManager.handleCommand(new FollowerInitialSyncUpStatus(true, shardId));
1197 assertTrue(shardManager.getMBean().getSyncStatus());
1199 // Send status false will make sync status false
1200 shardManager.handleCommand(new FollowerInitialSyncUpStatus(false, shardId));
1202 assertFalse(shardManager.getMBean().getSyncStatus());
1206 public void testWhenMultipleShardsPresentSyncStatusMustBeTrueForAllShards() throws Exception {
1207 LOG.info("testWhenMultipleShardsPresentSyncStatusMustBeTrueForAllShards starting");
1208 TestShardManager shardManager = newTestShardManager(newShardMgrProps(new MockConfiguration() {
1210 public List<String> getMemberShardNames(final MemberName memberName) {
1211 return Arrays.asList("default", "astronauts");
1215 // Initially will be false
1216 assertFalse(shardManager.getMBean().getSyncStatus());
1218 // Make default shard leader
1219 String defaultShardId = "member-1-shard-default-" + shardMrgIDSuffix;
1220 shardManager.handleCommand(new RoleChangeNotification(defaultShardId,
1221 RaftState.Follower.name(), RaftState.Leader.name()));
1223 // default = Leader, astronauts is unknown so sync status remains false
1224 assertFalse(shardManager.getMBean().getSyncStatus());
1226 // Make astronauts shard leader as well
1227 String astronautsShardId = "member-1-shard-astronauts-" + shardMrgIDSuffix;
1228 shardManager.handleCommand(new RoleChangeNotification(astronautsShardId,
1229 RaftState.Follower.name(), RaftState.Leader.name()));
1231 // Now sync status should be true
1232 assertTrue(shardManager.getMBean().getSyncStatus());
1234 // Make astronauts a Follower
1235 shardManager.handleCommand(new RoleChangeNotification(astronautsShardId,
1236 RaftState.Leader.name(), RaftState.Follower.name()));
1238 // Sync status is not true
1239 assertFalse(shardManager.getMBean().getSyncStatus());
1241 // Make the astronauts follower sync status true
1242 shardManager.handleCommand(new FollowerInitialSyncUpStatus(true, astronautsShardId));
1244 // Sync status is now true
1245 assertTrue(shardManager.getMBean().getSyncStatus());
1247 LOG.info("testWhenMultipleShardsPresentSyncStatusMustBeTrueForAllShards ending");
1251 public void testOnReceiveSwitchShardBehavior() {
1252 final TestKit kit = new TestKit(getSystem());
1253 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
1255 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1256 shardManager.tell(new ActorInitialized(), mockShardActor);
1258 shardManager.tell(new SwitchShardBehavior(mockShardName, RaftState.Leader, 1000), kit.getRef());
1260 SwitchBehavior switchBehavior = MessageCollectorActor.expectFirstMatching(mockShardActor,
1261 SwitchBehavior.class);
1263 assertEquals(RaftState.Leader, switchBehavior.getNewState());
1264 assertEquals(1000, switchBehavior.getNewTerm());
1267 private static List<MemberName> members(final String... names) {
1268 return Arrays.asList(names).stream().map(MemberName::forName).collect(Collectors.toList());
1272 public void testOnCreateShard() {
1273 LOG.info("testOnCreateShard starting");
1274 final TestKit kit = new TestKit(getSystem());
1275 datastoreContextBuilder.shardInitializationTimeout(1, TimeUnit.MINUTES).persistent(true);
1277 ActorRef shardManager = actorFactory
1278 .createActor(newShardMgrProps(new ConfigurationImpl(new EmptyModuleShardConfigProvider()))
1279 .withDispatcher(Dispatchers.DefaultDispatcherId()));
1281 EffectiveModelContext schemaContext = TEST_SCHEMA_CONTEXT;
1282 shardManager.tell(new UpdateSchemaContext(schemaContext), ActorRef.noSender());
1284 DatastoreContext datastoreContext = DatastoreContext.newBuilder().shardElectionTimeoutFactor(100)
1285 .persistent(false).build();
1286 Shard.Builder shardBuilder = Shard.builder();
1288 ModuleShardConfiguration config = new ModuleShardConfiguration(XMLNamespace.of("foo-ns"), "foo-module",
1289 "foo", null, members("member-1", "member-5", "member-6"));
1290 shardManager.tell(new CreateShard(config, shardBuilder, datastoreContext), kit.getRef());
1292 kit.expectMsgClass(Duration.ofSeconds(5), Success.class);
1294 shardManager.tell(new FindLocalShard("foo", true), kit.getRef());
1296 kit.expectMsgClass(Duration.ofSeconds(5), LocalShardFound.class);
1298 assertFalse("isRecoveryApplicable", shardBuilder.getDatastoreContext().isPersistent());
1299 assertTrue("Epxected ShardPeerAddressResolver", shardBuilder.getDatastoreContext().getShardRaftConfig()
1300 .getPeerAddressResolver() instanceof ShardPeerAddressResolver);
1301 assertEquals("peerMembers", Sets.newHashSet(
1302 ShardIdentifier.create("foo", MemberName.forName("member-5"), shardMrgIDSuffix).toString(),
1303 ShardIdentifier.create("foo", MemberName.forName("member-6"), shardMrgIDSuffix).toString()),
1304 shardBuilder.getPeerAddresses().keySet());
1305 assertEquals("ShardIdentifier", ShardIdentifier.create("foo", MEMBER_1, shardMrgIDSuffix),
1306 shardBuilder.getId());
1307 assertSame("schemaContext", schemaContext, shardBuilder.getSchemaContext());
1309 // Send CreateShard with same name - should return Success with
1312 shardManager.tell(new CreateShard(config, shardBuilder, null), kit.getRef());
1314 Success success = kit.expectMsgClass(Duration.ofSeconds(5), Success.class);
1315 assertNotNull("Success status is null", success.status());
1317 LOG.info("testOnCreateShard ending");
1321 public void testOnCreateShardWithLocalMemberNotInShardConfig() {
1322 LOG.info("testOnCreateShardWithLocalMemberNotInShardConfig starting");
1323 final TestKit kit = new TestKit(getSystem());
1324 datastoreContextBuilder.shardInitializationTimeout(1, TimeUnit.MINUTES).persistent(true);
1326 ActorRef shardManager = actorFactory
1327 .createActor(newShardMgrProps(new ConfigurationImpl(new EmptyModuleShardConfigProvider()))
1328 .withDispatcher(Dispatchers.DefaultDispatcherId()));
1330 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), ActorRef.noSender());
1332 Shard.Builder shardBuilder = Shard.builder();
1333 ModuleShardConfiguration config = new ModuleShardConfiguration(XMLNamespace.of("foo-ns"), "foo-module",
1334 "foo", null, members("member-5", "member-6"));
1336 shardManager.tell(new CreateShard(config, shardBuilder, null), kit.getRef());
1337 kit.expectMsgClass(Duration.ofSeconds(5), Success.class);
1339 shardManager.tell(new FindLocalShard("foo", true), kit.getRef());
1340 kit.expectMsgClass(Duration.ofSeconds(5), LocalShardFound.class);
1342 assertEquals("peerMembers size", 0, shardBuilder.getPeerAddresses().size());
1343 assertEquals("schemaContext", DisableElectionsRaftPolicy.class.getName(), shardBuilder
1344 .getDatastoreContext().getShardRaftConfig().getCustomRaftPolicyImplementationClass());
1346 LOG.info("testOnCreateShardWithLocalMemberNotInShardConfig ending");
1350 public void testOnCreateShardWithNoInitialSchemaContext() {
1351 LOG.info("testOnCreateShardWithNoInitialSchemaContext starting");
1352 final TestKit kit = new TestKit(getSystem());
1353 ActorRef shardManager = actorFactory
1354 .createActor(newShardMgrProps(new ConfigurationImpl(new EmptyModuleShardConfigProvider()))
1355 .withDispatcher(Dispatchers.DefaultDispatcherId()));
1357 Shard.Builder shardBuilder = Shard.builder();
1359 ModuleShardConfiguration config = new ModuleShardConfiguration(XMLNamespace.of("foo-ns"), "foo-module",
1360 "foo", null, members("member-1"));
1361 shardManager.tell(new CreateShard(config, shardBuilder, null), kit.getRef());
1363 kit.expectMsgClass(Duration.ofSeconds(5), Success.class);
1365 EffectiveModelContext schemaContext = TEST_SCHEMA_CONTEXT;
1366 shardManager.tell(new UpdateSchemaContext(schemaContext), ActorRef.noSender());
1368 shardManager.tell(new FindLocalShard("foo", true), kit.getRef());
1370 kit.expectMsgClass(Duration.ofSeconds(5), LocalShardFound.class);
1372 assertSame("schemaContext", schemaContext, shardBuilder.getSchemaContext());
1373 assertNotNull("schemaContext is null", shardBuilder.getDatastoreContext());
1375 LOG.info("testOnCreateShardWithNoInitialSchemaContext ending");
1379 public void testGetSnapshot() {
1380 LOG.info("testGetSnapshot starting");
1381 TestKit kit = new TestKit(getSystem());
1383 MockConfiguration mockConfig = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
1384 .put("shard1", Arrays.asList("member-1")).put("shard2", Arrays.asList("member-1"))
1385 .put("astronauts", Collections.<String>emptyList()).build());
1387 TestActorRef<TestShardManager> shardManager = actorFactory.createTestActor(newShardMgrProps(mockConfig)
1388 .withDispatcher(Dispatchers.DefaultDispatcherId()));
1390 shardManager.tell(GetSnapshot.INSTANCE, kit.getRef());
1391 Failure failure = kit.expectMsgClass(Failure.class);
1392 assertEquals("Failure cause type", IllegalStateException.class, failure.cause().getClass());
1394 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), ActorRef.noSender());
1396 waitForShardInitialized(shardManager, "shard1", kit);
1397 waitForShardInitialized(shardManager, "shard2", kit);
1399 shardManager.tell(GetSnapshot.INSTANCE, kit.getRef());
1401 DatastoreSnapshot datastoreSnapshot = expectMsgClassOrFailure(DatastoreSnapshot.class, kit, "GetSnapshot");
1403 assertEquals("getType", shardMrgIDSuffix, datastoreSnapshot.getType());
1404 assertNull("Expected null ShardManagerSnapshot", datastoreSnapshot.getShardManagerSnapshot());
1406 assertEquals("Shard names", Sets.newHashSet("shard1", "shard2"), Sets.newHashSet(
1407 datastoreSnapshot.getShardSnapshots().stream().map(ShardSnapshot::getName).collect(Collectors.toSet())));
1409 // Add a new replica
1411 TestKit mockShardLeaderKit = new TestKit(getSystem());
1413 TestShardManager shardManagerInstance = shardManager.underlyingActor();
1414 shardManagerInstance.setMessageInterceptor(newFindPrimaryInterceptor(mockShardLeaderKit.getRef()));
1416 shardManager.tell(new AddShardReplica("astronauts"), kit.getRef());
1417 mockShardLeaderKit.expectMsgClass(AddServer.class);
1418 mockShardLeaderKit.reply(new AddServerReply(ServerChangeStatus.OK, ""));
1419 kit.expectMsgClass(Status.Success.class);
1420 waitForShardInitialized(shardManager, "astronauts", kit);
1422 // Send another GetSnapshot and verify
1424 shardManager.tell(GetSnapshot.INSTANCE, kit.getRef());
1425 datastoreSnapshot = expectMsgClassOrFailure(DatastoreSnapshot.class, kit, "GetSnapshot");
1427 assertEquals("Shard names", Sets.newHashSet("shard1", "shard2", "astronauts"), Sets.newHashSet(
1428 Lists.transform(datastoreSnapshot.getShardSnapshots(), ShardSnapshot::getName)));
1430 ShardManagerSnapshot snapshot = datastoreSnapshot.getShardManagerSnapshot();
1431 assertNotNull("Expected ShardManagerSnapshot", snapshot);
1432 assertEquals("Shard names", Sets.newHashSet("shard1", "shard2", "astronauts"),
1433 Sets.newHashSet(snapshot.getShardList()));
1435 LOG.info("testGetSnapshot ending");
1439 public void testRestoreFromSnapshot() {
// Starts a shard manager from a DatastoreSnapshot and checks that, once the shards report as initialized,
// a GetSnapshot request returns a ShardManagerSnapshot listing the same three shard names.
1440 LOG.info("testRestoreFromSnapshot starting");
1442 datastoreContextBuilder.shardInitializationTimeout(3, TimeUnit.SECONDS);
1444 TestKit kit = new TestKit(getSystem());
// Every shard is configured with an empty member list; the names asserted at the end match the shard list
// of the snapshot built below. NOTE(review): presumably an empty member list means no replica is configured
// for this member, so the shards can only originate from the restored snapshot - confirm.
1446 MockConfiguration mockConfig = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
1447 .put("shard1", Collections.<String>emptyList()).put("shard2", Collections.<String>emptyList())
1448 .put("astronauts", Collections.<String>emptyList()).build());
// Snapshot to restore from: a shard-manager shard list and an empty list of per-shard snapshots.
1450 ShardManagerSnapshot snapshot =
1451 new ShardManagerSnapshot(Arrays.asList("shard1", "shard2", "astronauts"));
1452 DatastoreSnapshot restoreFromSnapshot = new DatastoreSnapshot(shardMrgIDSuffix, snapshot,
1453 Collections.<ShardSnapshot>emptyList());
1454 TestActorRef<TestShardManager> shardManager = actorFactory.createTestActor(newTestShardMgrBuilder(mockConfig)
1455 .restoreFromSnapshot(restoreFromSnapshot).props().withDispatcher(Dispatchers.DefaultDispatcherId()));
// Wait on the test actor's recovery-complete hook before sending it any messages.
1457 shardManager.underlyingActor().waitForRecoveryComplete();
1459 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), ActorRef.noSender());
// All three restored shards are expected to become initialized.
1461 waitForShardInitialized(shardManager, "shard1", kit);
1462 waitForShardInitialized(shardManager, "shard2", kit);
1463 waitForShardInitialized(shardManager, "astronauts", kit);
// Ask for a fresh snapshot and compare its type and shard list with what was restored.
1465 shardManager.tell(GetSnapshot.INSTANCE, kit.getRef());
1467 DatastoreSnapshot datastoreSnapshot = expectMsgClassOrFailure(DatastoreSnapshot.class, kit, "GetSnapshot");
1469 assertEquals("getType", shardMrgIDSuffix, datastoreSnapshot.getType());
1471 assertNotNull("Expected ShardManagerSnapshot", datastoreSnapshot.getShardManagerSnapshot());
1472 assertEquals("Shard names", Sets.newHashSet("shard1", "shard2", "astronauts"),
1473 Sets.newHashSet(datastoreSnapshot.getShardManagerSnapshot().getShardList()));
1475 LOG.info("testRestoreFromSnapshot ending");
1479 public void testAddShardReplicaForNonExistentShardConfig() {
// Verifies that AddShardReplica for a shard name the configuration does not know is answered with a
// Status.Failure whose cause is an IllegalArgumentException.
1480 final TestKit kit = new TestKit(getSystem());
// The configuration is built on an EmptyModuleShardConfigProvider, so "model-inventory" is presumably
// not defined in it.
1481 ActorRef shardManager = actorFactory
1482 .createActor(newShardMgrProps(new ConfigurationImpl(new EmptyModuleShardConfigProvider()))
1483 .withDispatcher(Dispatchers.DefaultDispatcherId()));
1485 shardManager.tell(new AddShardReplica("model-inventory"), kit.getRef());
// The failure reply is awaited for at most 2 seconds.
1486 Status.Failure resp = kit.expectMsgClass(Duration.ofSeconds(2), Status.Failure.class);
1488 assertTrue("Failure obtained", resp.cause() instanceof IllegalArgumentException);
1492 public void testAddShardReplica() {
// Exercises AddShardReplica across two actor systems: member-1's shard manager requests an "astronauts"
// replica, the mock leader created in member-2's system must receive an AddServer naming member-1's shard id,
// the requester must get Status.Success, and exactly one ShardManagerSnapshot listing "default" and
// "astronauts" must remain in the in-memory snapshot store.
1493 LOG.info("testAddShardReplica starting");
// "default" is configured on both members; "astronauts" only on member-2.
1494 MockConfiguration mockConfig = new MockConfiguration(
1495 ImmutableMap.<String, List<String>>builder().put("default", Arrays.asList("member-1", "member-2"))
1496 .put("astronauts", Arrays.asList("member-2")).build());
// The same id is used as the persistence id and, further down, as the key into InMemorySnapshotStore.
1498 final String shardManagerID = ShardManagerIdentifier.builder().type(shardMrgIDSuffix).build().toString();
1499 datastoreContextBuilder.shardManagerPersistenceId(shardManagerID);
1501 // Create an ActorSystem ShardManager actor for member-1.
1502 final ActorSystem system1 = newActorSystem("Member1");
1503 Cluster.get(system1).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
1504 ActorRef mockDefaultShardActor = newMockShardActor(system1, Shard.DEFAULT_NAME, "member-1");
1505 final TestActorRef<TestShardManager> newReplicaShardManager = TestActorRef.create(system1,
1506 newTestShardMgrBuilder(mockConfig).shardActor(mockDefaultShardActor)
1507 .cluster(new ClusterWrapperImpl(system1)).props()
1508 .withDispatcher(Dispatchers.DefaultDispatcherId()),
1511 // Create an ActorSystem ShardManager actor for member-2.
1512 final ActorSystem system2 = newActorSystem("Member2");
1513 Cluster.get(system2).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
// NOTE(review): memberId2 is built from shardMrgIDSuffix while the shard id on the next line uses the
// literal type "config" - confirm the two are meant to agree.
1515 String memberId2 = "member-2-shard-astronauts-" + shardMrgIDSuffix;
1516 String name = ShardIdentifier.create("astronauts", MEMBER_2, "config").toString();
// Mock leader: constructed with AddServer.class and a canned AddServerReply(OK, memberId2).
1517 final TestActorRef<MockRespondActor> mockShardLeaderActor = TestActorRef.create(system2,
1518 Props.create(MockRespondActor.class, AddServer.class,
1519 new AddServerReply(ServerChangeStatus.OK, memberId2))
1520 .withDispatcher(Dispatchers.DefaultDispatcherId()),
1522 final TestActorRef<TestShardManager> leaderShardManager = TestActorRef.create(system2,
1523 newTestShardMgrBuilder(mockConfig).shardActor(mockShardLeaderActor)
1524 .cluster(new ClusterWrapperImpl(system2)).props()
1525 .withDispatcher(Dispatchers.DefaultDispatcherId()),
1528 final TestKit kit = new TestKit(getSystem());
1529 newReplicaShardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1530 leaderShardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
// Drive member-2's shard manager with the notifications a shard would send: initialized, leader state
// (leader id equal to its own id) and a Candidate -> Leader role change.
1532 leaderShardManager.tell(new ActorInitialized(), mockShardLeaderActor);
// The leader advertises a version one below the current data store version.
1534 short leaderVersion = DataStoreVersions.CURRENT_VERSION - 1;
1535 leaderShardManager.tell(
1536 new ShardLeaderStateChanged(memberId2, memberId2, mock(DataTree.class), leaderVersion),
1537 mockShardLeaderActor);
1538 leaderShardManager.tell(
1539 new RoleChangeNotification(memberId2, RaftState.Candidate.name(), RaftState.Leader.name()),
1540 mockShardLeaderActor);
// Both shard managers wait on their member-up hook before the replica request is issued.
1542 newReplicaShardManager.underlyingActor().waitForMemberUp();
1543 leaderShardManager.underlyingActor().waitForMemberUp();
1545 // Have a dummy snapshot to be overwritten by the new data
1547 String[] restoredShards = { "default", "people" };
1548 ShardManagerSnapshot snapshot =
1549 new ShardManagerSnapshot(Arrays.asList(restoredShards));
1550 InMemorySnapshotStore.addSnapshot(shardManagerID, snapshot);
// NOTE(review): the reason for this 2 ms pause is not evident from the visible code - presumably it
// separates the seeded snapshot from the one saved later; confirm or remove.
1551 Uninterruptibles.sleepUninterruptibly(2, TimeUnit.MILLISECONDS);
// Latches are registered before the request is sent; the waitFor* calls below rely on them.
1553 InMemorySnapshotStore.addSnapshotSavedLatch(shardManagerID);
1554 InMemorySnapshotStore.addSnapshotDeletedLatch(shardManagerID);
1556 // construct a mock response message
1557 newReplicaShardManager.tell(new AddShardReplica("astronauts"), kit.getRef());
1558 AddServer addServerMsg = MessageCollectorActor.expectFirstMatching(mockShardLeaderActor,
// The AddServer seen by the leader must name member-1's new "astronauts" replica.
1560 String addServerId = "member-1-shard-astronauts-" + shardMrgIDSuffix;
1561 assertEquals("AddServer serverId", addServerId, addServerMsg.getNewServerId());
1562 kit.expectMsgClass(Duration.ofSeconds(5), Status.Success.class);
// After a save and a delete have been observed, exactly one snapshot is expected and its shard list must be
// {"default", "astronauts"} rather than the seeded {"default", "people"}.
1564 InMemorySnapshotStore.waitForSavedSnapshot(shardManagerID, ShardManagerSnapshot.class);
1565 InMemorySnapshotStore.waitForDeletedSnapshot(shardManagerID);
1566 List<ShardManagerSnapshot> persistedSnapshots = InMemorySnapshotStore.getSnapshots(shardManagerID,
1567 ShardManagerSnapshot.class);
1568 assertEquals("Number of snapshots persisted", 1, persistedSnapshots.size());
1569 ShardManagerSnapshot shardManagerSnapshot = persistedSnapshots.get(0);
1570 assertEquals("Persisted local shards", Sets.newHashSet("default", "astronauts"),
1571 Sets.newHashSet(shardManagerSnapshot.getShardList()));
1572 LOG.info("testAddShardReplica ending");
1576 public void testAddShardReplicaWithPreExistingReplicaInRemoteShardLeader() {
// Verifies that AddShardReplica fails with AlreadyExistsException when the leader answers AddServer with
// ALREADY_EXISTS, that a repeated request fails the same way, and that the existing local shard is still
// found by FindLocalShard after each failure, including a final failure provoked after CLEAR_RESPONSE.
1577 LOG.info("testAddShardReplicaWithPreExistingReplicaInRemoteShardLeader starting");
1578 final TestKit kit = new TestKit(getSystem());
1579 TestActorRef<TestShardManager> shardManager = actorFactory
1580 .createTestActor(newPropsShardMgrWithMockShardActor(), shardMgrID);
1582 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1583 shardManager.tell(new ActorInitialized(), mockShardActor);
// The mock leader is created as a child of the shard manager's own context, named with leaderId, and is
// constructed with AddServer.class and a canned ALREADY_EXISTS reply.
1585 String leaderId = "leader-member-shard-default-" + shardMrgIDSuffix;
1586 AddServerReply addServerReply = new AddServerReply(ServerChangeStatus.ALREADY_EXISTS, null);
1587 ActorRef leaderShardActor = shardManager.underlyingActor().getContext()
1588 .actorOf(Props.create(MockRespondActor.class, AddServer.class, addServerReply), leaderId);
1590 MockClusterWrapper.sendMemberUp(shardManager, "leader-member", leaderShardActor.path().toString());
// Notifications for the local replica: a Candidate -> Follower role change, then a leader state change
// that names leaderId as the leader.
1592 String newReplicaId = "member-1-shard-default-" + shardMrgIDSuffix;
1594 new RoleChangeNotification(newReplicaId, RaftState.Candidate.name(), RaftState.Follower.name()),
1597 new ShardLeaderStateChanged(newReplicaId, leaderId, DataStoreVersions.CURRENT_VERSION),
1600 shardManager.tell(new AddShardReplica(Shard.DEFAULT_NAME), kit.getRef());
// The request must have been forwarded to the leader as an AddServer.
1602 MessageCollectorActor.expectFirstMatching(leaderShardActor, AddServer.class);
1604 Failure resp = kit.expectMsgClass(Duration.ofSeconds(5), Failure.class);
1605 assertEquals("Failure cause", AlreadyExistsException.class, resp.cause().getClass());
// The pre-existing local shard must still be registered.
1607 shardManager.tell(new FindLocalShard(Shard.DEFAULT_NAME, false), kit.getRef());
1608 kit.expectMsgClass(Duration.ofSeconds(5), LocalShardFound.class);
1610 // Send message again to verify previous in progress state is
1613 shardManager.tell(new AddShardReplica(Shard.DEFAULT_NAME), kit.getRef());
1614 resp = kit.expectMsgClass(Duration.ofSeconds(5), Failure.class);
1615 assertEquals("Failure cause", AlreadyExistsException.class, resp.cause().getClass());
1617 // Send message again with an AddServer timeout to verify the
1618 // pre-existing shard actor isn't terminated.
// A datastore context factory with a 100 ms shardLeaderElectionTimeout is built here.
// NOTE(review): CLEAR_RESPONSE presumably stops the mock leader from replying so that the AddServer request
// times out - confirm against MockRespondActor.
1621 newDatastoreContextFactory(
1622 datastoreContextBuilder.shardLeaderElectionTimeout(100, TimeUnit.MILLISECONDS).build()), kit.getRef());
1623 leaderShardActor.tell(MockRespondActor.CLEAR_RESPONSE, ActorRef.noSender());
1624 shardManager.tell(new AddShardReplica(Shard.DEFAULT_NAME), kit.getRef());
// Only the failure type is checked here, not its cause.
1625 kit.expectMsgClass(Duration.ofSeconds(5), Failure.class);
1627 shardManager.tell(new FindLocalShard(Shard.DEFAULT_NAME, false), kit.getRef());
1628 kit.expectMsgClass(Duration.ofSeconds(5), LocalShardFound.class);
1630 LOG.info("testAddShardReplicaWithPreExistingReplicaInRemoteShardLeader ending");
1634 public void testAddShardReplicaWithPreExistingLocalReplicaLeader() {
// Verifies that AddShardReplica for the default shard fails with AlreadyExistsException after the shard
// manager has been told that the local replica is the leader, and that the local shard is still found
// afterwards.
1635 LOG.info("testAddShardReplicaWithPreExistingLocalReplicaLeader starting");
1636 final TestKit kit = new TestKit(getSystem());
1637 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
1638 ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
1640 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1641 shardManager.tell(new ActorInitialized(), mockShardActor);
// The same id is passed in the first two arguments. NOTE(review): presumably (member id, leader id),
// i.e. the local replica is its own leader - confirm against ShardLeaderStateChanged.
1642 shardManager.tell(new ShardLeaderStateChanged(memberId, memberId, mock(DataTree.class),
1643 DataStoreVersions.CURRENT_VERSION), kit.getRef());
// Role change Candidate -> Leader for the local replica.
1645 new RoleChangeNotification(memberId, RaftState.Candidate.name(), RaftState.Leader.name()),
1648 shardManager.tell(new AddShardReplica(Shard.DEFAULT_NAME), kit.getRef());
1649 Failure resp = kit.expectMsgClass(Duration.ofSeconds(5), Failure.class);
1650 assertEquals("Failure cause", AlreadyExistsException.class, resp.cause().getClass());
// The rejected request must not have removed the existing local shard.
1652 shardManager.tell(new FindLocalShard(Shard.DEFAULT_NAME, false), kit.getRef());
1653 kit.expectMsgClass(Duration.ofSeconds(5), LocalShardFound.class);
1655 LOG.info("testAddShardReplicaWithPreExistingLocalReplicaLeader ending");
1659 public void testAddShardReplicaWithAddServerReplyFailure() {
// Verifies how failed AddServerReply statuses are reported to the AddShardReplica requester:
// TIMEOUT yields a TimeoutException, leaves no local "astronauts" shard and terminates the new replica actor;
// NO_LEADER yields a NoShardLeaderException.
1660 LOG.info("testAddShardReplicaWithAddServerReplyFailure starting");
1661 final TestKit kit = new TestKit(getSystem());
1662 final TestKit mockShardLeaderKit = new TestKit(getSystem());
// "astronauts" is configured on member-2 only.
1664 MockConfiguration mockConfig = new MockConfiguration(
1665 ImmutableMap.of("astronauts", Arrays.asList("member-2")));
1667 ActorRef mockNewReplicaShardActor = newMockShardActor(getSystem(), "astronauts", "member-1");
1668 final TestActorRef<TestShardManager> shardManager = actorFactory.createTestActor(
1669 newTestShardMgrBuilder(mockConfig).shardActor(mockNewReplicaShardActor).props()
1670 .withDispatcher(Dispatchers.DefaultDispatcherId()), shardMgrID);
// With this interceptor installed, the AddServer messages below arrive at mockShardLeaderKit.
1671 shardManager.underlyingActor().setMessageInterceptor(newFindPrimaryInterceptor(mockShardLeaderKit.getRef()));
1673 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
// A separate kit watches the new replica actor so its termination can be asserted later.
1675 TestKit terminateWatcher = new TestKit(getSystem());
1676 terminateWatcher.watch(mockNewReplicaShardActor);
1678 shardManager.tell(new AddShardReplica("astronauts"), kit.getRef());
// First attempt: the leader kit answers the AddServer with TIMEOUT.
1680 AddServer addServerMsg = mockShardLeaderKit.expectMsgClass(AddServer.class);
1681 assertEquals("AddServer serverId", "member-1-shard-astronauts-" + shardMrgIDSuffix,
1682 addServerMsg.getNewServerId());
1683 mockShardLeaderKit.reply(new AddServerReply(ServerChangeStatus.TIMEOUT, null));
1685 Failure failure = kit.expectMsgClass(Duration.ofSeconds(5), Failure.class);
1686 assertEquals("Failure cause", TimeoutException.class, failure.cause().getClass());
// After the failure no local shard may be registered and the replica actor must have terminated.
1688 shardManager.tell(new FindLocalShard("astronauts", false), kit.getRef());
1689 kit.expectMsgClass(Duration.ofSeconds(5), LocalShardNotFound.class);
1691 terminateWatcher.expectTerminated(mockNewReplicaShardActor);
// Second attempt: the leader kit answers with NO_LEADER.
1693 shardManager.tell(new AddShardReplica("astronauts"), kit.getRef());
1694 mockShardLeaderKit.expectMsgClass(AddServer.class);
1695 mockShardLeaderKit.reply(new AddServerReply(ServerChangeStatus.NO_LEADER, null));
1696 failure = kit.expectMsgClass(Duration.ofSeconds(5), Failure.class);
1697 assertEquals("Failure cause", NoShardLeaderException.class, failure.cause().getClass());
1699 LOG.info("testAddShardReplicaWithAddServerReplyFailure ending");
1703 public void testAddShardReplicaWithAlreadyInProgress() {
// Delegates to testServerChangeWhenAlreadyInProgress with AddShardReplica("astronauts") as both the first
// and the second request; AddServer is the message class expected at the mock leader for the first one.
1704 testServerChangeWhenAlreadyInProgress("astronauts", new AddShardReplica("astronauts"),
1705 AddServer.class, new AddShardReplica("astronauts"));
1709 public void testAddShardReplicaWithFindPrimaryTimeout() {
// Verifies that AddShardReplica is answered with a Status.Failure when member-2, the only member configured
// for "astronauts", is announced at an address in an actor system named "non-existent".
1710 LOG.info("testAddShardReplicaWithFindPrimaryTimeout starting");
// NOTE(review): the 100 ms shard initialization timeout presumably bounds how long the primary lookup
// waits, keeping the test short - confirm.
1711 datastoreContextBuilder.shardInitializationTimeout(100, TimeUnit.MILLISECONDS);
1712 final TestKit kit = new TestKit(getSystem());
1713 MockConfiguration mockConfig = new MockConfiguration(ImmutableMap.of("astronauts", Arrays.asList("member-2")));
1715 final ActorRef newReplicaShardManager = actorFactory
1716 .createActor(newTestShardMgrBuilder(mockConfig).shardActor(mockShardActor).props()
1717 .withDispatcher(Dispatchers.DefaultDispatcherId()), shardMgrID);
1719 newReplicaShardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1720 MockClusterWrapper.sendMemberUp(newReplicaShardManager, "member-2",
1721 AddressFromURIString.parse("akka://non-existent@127.0.0.1:5").toString());
1723 newReplicaShardManager.tell(new AddShardReplica("astronauts"), kit.getRef());
1724 Status.Failure resp = kit.expectMsgClass(Duration.ofSeconds(5), Status.Failure.class);
// NOTE(review): any RuntimeException satisfies this check; a more specific cause type would make the
// assertion stronger if the expected exception is known.
1725 assertTrue("Failure obtained", resp.cause() instanceof RuntimeException);
1727 LOG.info("testAddShardReplicaWithFindPrimaryTimeout ending");
1731 public void testRemoveShardReplicaForNonExistentShard() {
// Verifies that RemoveShardReplica for a shard name the configuration does not know is answered with a
// Status.Failure whose cause is a PrimaryNotFoundException.
1732 final TestKit kit = new TestKit(getSystem());
// The configuration is built on an EmptyModuleShardConfigProvider, so "model-inventory" is presumably
// not defined in it.
1733 ActorRef shardManager = actorFactory
1734 .createActor(newShardMgrProps(new ConfigurationImpl(new EmptyModuleShardConfigProvider()))
1735 .withDispatcher(Dispatchers.DefaultDispatcherId()));
1737 shardManager.tell(new RemoveShardReplica("model-inventory", MEMBER_1), kit.getRef());
// The failure reply is awaited for up to 10 seconds.
1738 Status.Failure resp = kit.expectMsgClass(Duration.ofSeconds(10), Status.Failure.class);
1739 assertTrue("Failure obtained", resp.cause() instanceof PrimaryNotFoundException);
1746 public void testRemoveShardReplicaLocal() {
// Verifies RemoveShardReplica when the local shard has been reported as leader: the local shard actor must
// receive a RemoveServer carrying member-1's shard id and the requester must get a Success.
1747 final TestKit kit = new TestKit(getSystem());
1748 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
// Stand-in for the local shard: constructed with RemoveServer.class and a canned RemoveServerReply(OK).
1750 final ActorRef respondActor = actorFactory.createActor(Props.create(MockRespondActor.class,
1751 RemoveServer.class, new RemoveServerReply(ServerChangeStatus.OK, null)), memberId);
// NOTE(review): this shard manager is created with getSystem().actorOf(...) whereas other tests in this
// class use actorFactory - confirm the actor is stopped at teardown.
1753 ActorRef shardManager = getSystem().actorOf(newPropsShardMgrWithMockShardActor(respondActor));
1755 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1756 shardManager.tell(new ActorInitialized(), respondActor);
// Leader state names the local member id in both id arguments, followed by a Candidate -> Leader role change.
1757 shardManager.tell(new ShardLeaderStateChanged(memberId, memberId, mock(DataTree.class),
1758 DataStoreVersions.CURRENT_VERSION), kit.getRef());
1760 new RoleChangeNotification(memberId, RaftState.Candidate.name(), RaftState.Leader.name()),
1763 shardManager.tell(new RemoveShardReplica(Shard.DEFAULT_NAME, MEMBER_1), kit.getRef());
// The RemoveServer received by the shard must identify member-1's default shard.
1764 final RemoveServer removeServer = MessageCollectorActor.expectFirstMatching(respondActor,
1765 RemoveServer.class);
1766 assertEquals(ShardIdentifier.create("default", MEMBER_1, shardMrgIDSuffix).toString(),
1767 removeServer.getServerId());
1768 kit.expectMsgClass(Duration.ofSeconds(5), Success.class);
1772 public void testRemoveShardReplicaRemote() {
// Verifies RemoveShardReplica when the shard leader is on another member: member-1's shard manager is told
// that member-2 leads the default shard, and a RemoveShardReplica sent to member-1 must reach the mock leader
// in member-2's actor system as a RemoveServer naming member-1's shard id, with Status.Success returned.
1773 MockConfiguration mockConfig = new MockConfiguration(
1774 ImmutableMap.<String, List<String>>builder().put("default", Arrays.asList("member-1", "member-2"))
1775 .put("astronauts", Arrays.asList("member-1")).build());
1777 String shardManagerID = ShardManagerIdentifier.builder().type(shardMrgIDSuffix).build().toString();
1779 // Create an ActorSystem ShardManager actor for member-1.
1780 final ActorSystem system1 = newActorSystem("Member1");
1781 Cluster.get(system1).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
1782 ActorRef mockDefaultShardActor = newMockShardActor(system1, Shard.DEFAULT_NAME, "member-1");
1784 final TestActorRef<TestShardManager> newReplicaShardManager = TestActorRef.create(system1,
1785 newTestShardMgrBuilder().configuration(mockConfig).shardActor(mockDefaultShardActor).cluster(
1786 new ClusterWrapperImpl(system1)).props().withDispatcher(Dispatchers.DefaultDispatcherId()),
1789 // Create an ActorSystem ShardManager actor for member-2.
1790 final ActorSystem system2 = newActorSystem("Member2");
1791 Cluster.get(system2).join(AddressFromURIString.parse("akka://cluster-test@127.0.0.1:2558"));
// Mock leader in system2: constructed with RemoveServer.class and a canned RemoveServerReply(OK, memberId2).
1793 String name = ShardIdentifier.create("default", MEMBER_2, shardMrgIDSuffix).toString();
1794 String memberId2 = "member-2-shard-default-" + shardMrgIDSuffix;
1795 final TestActorRef<MockRespondActor> mockShardLeaderActor =
1796 TestActorRef.create(system2, Props.create(MockRespondActor.class, RemoveServer.class,
1797 new RemoveServerReply(ServerChangeStatus.OK, memberId2)), name);
// NOTE(review): this is logged at ERROR level although it reads as informational output - consider
// info/debug so that test logs do not show spurious errors.
1799 LOG.error("Mock Shard Leader Actor : {}", mockShardLeaderActor);
1801 final TestActorRef<TestShardManager> leaderShardManager = TestActorRef.create(system2,
1802 newTestShardMgrBuilder().configuration(mockConfig).shardActor(mockShardLeaderActor).cluster(
1803 new ClusterWrapperImpl(system2)).props().withDispatcher(Dispatchers.DefaultDispatcherId()),
1806 // Because mockShardLeaderActor is created at the top level of the actor system it has an address like so,
1807 // akka://cluster-test@127.0.0.1:2559/user/member-2-shard-default-config1
1808 // However when a shard manager has a local shard which is a follower and a leader that is remote it will
1809 // try to compute an address for the remote shard leader using the ShardPeerAddressResolver. This address will
1811 // akka://cluster-test@127.0.0.1:2559/user/shardmanager-config1/member-2-shard-default-config1
1812 // In this specific case if we did a FindPrimary for shard default from member-1 we would come up
1813 // with the address of an actor which does not exist, therefore any message sent to that actor would go to
1815 // To work around this problem we create a ForwardingActor with the right address and pass to it the
1816 // mockShardLeaderActor. The ForwardingActor simply forwards all messages to the mockShardLeaderActor and every
1817 // thing works as expected
1818 final ActorRef actorRef = leaderShardManager.underlyingActor().context()
1819 .actorOf(Props.create(ForwardingActor.class, mockShardLeaderActor),
1820 "member-2-shard-default-" + shardMrgIDSuffix);
// NOTE(review): same remark as above - ERROR level for what reads as an informational message.
1822 LOG.error("Forwarding actor : {}", actorRef);
1824 final TestKit kit = new TestKit(getSystem());
1825 newReplicaShardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1826 leaderShardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
// NOTE(review): ActorInitialized is sent to member-1's shard manager with mockShardLeaderActor as sender,
// although mockDefaultShardActor was passed to it as its shard actor - confirm this is intended.
1828 leaderShardManager.tell(new ActorInitialized(), mockShardLeaderActor);
1829 newReplicaShardManager.tell(new ActorInitialized(), mockShardLeaderActor);
// The leader advertises a version one below the current data store version.
1831 short leaderVersion = DataStoreVersions.CURRENT_VERSION - 1;
// member-2's shard manager: its shard is the leader (Candidate -> Leader).
1832 leaderShardManager.tell(
1833 new ShardLeaderStateChanged(memberId2, memberId2, mock(DataTree.class), leaderVersion),
1834 mockShardLeaderActor);
1835 leaderShardManager.tell(
1836 new RoleChangeNotification(memberId2, RaftState.Candidate.name(), RaftState.Leader.name()),
1837 mockShardLeaderActor);
// member-1's shard manager: its shard is a follower (Candidate -> Follower) and memberId2 is named as leader.
1839 String memberId1 = "member-1-shard-default-" + shardMrgIDSuffix;
1840 newReplicaShardManager.tell(
1841 new ShardLeaderStateChanged(memberId1, memberId2, mock(DataTree.class), leaderVersion),
1843 newReplicaShardManager.tell(
1844 new RoleChangeNotification(memberId1, RaftState.Candidate.name(), RaftState.Follower.name()),
// Both shard managers wait on their member-up hook before the removal request is issued.
1847 newReplicaShardManager.underlyingActor().waitForMemberUp();
1848 leaderShardManager.underlyingActor().waitForMemberUp();
1850 // construct a mock response message
1851 newReplicaShardManager.tell(new RemoveShardReplica("default", MEMBER_1), kit.getRef());
// The RemoveServer collected at the mock leader must name member-1's default shard.
1852 RemoveServer removeServer = MessageCollectorActor.expectFirstMatching(mockShardLeaderActor,
1853 RemoveServer.class);
1854 String removeServerId = ShardIdentifier.create("default", MEMBER_1, shardMrgIDSuffix).toString();
1855 assertEquals("RemoveServer serverId", removeServerId, removeServer.getServerId());
1856 kit.expectMsgClass(Duration.ofSeconds(5), Status.Success.class);
1860 public void testRemoveShardReplicaWhenAnotherRemoveShardReplicaAlreadyInProgress() {
// Delegates to testServerChangeWhenAlreadyInProgress: the first request removes MEMBER_2's "astronauts"
// replica (expected at the mock leader as RemoveServer), the second removes MEMBER_3's replica.
1861 testServerChangeWhenAlreadyInProgress("astronauts", new RemoveShardReplica("astronauts", MEMBER_2),
1862 RemoveServer.class, new RemoveShardReplica("astronauts", MEMBER_3));
1866 public void testRemoveShardReplicaWhenAddShardReplicaAlreadyInProgress() {
// Delegates to testServerChangeWhenAlreadyInProgress: the first request is an AddShardReplica (expected at
// the mock leader as AddServer), the second a RemoveShardReplica for MEMBER_2 on the same shard.
1867 testServerChangeWhenAlreadyInProgress("astronauts", new AddShardReplica("astronauts"),
1868 AddServer.class, new RemoveShardReplica("astronauts", MEMBER_2));
1872 public void testServerChangeWhenAlreadyInProgress(final String shardName, final Object firstServerChange,
1873 final Class<?> firstForwardedServerChangeClass,
1874 final Object secondServerChange) {
// Shared scenario for the "already in progress" tests in this class.
//   shardName                       - shard configured (on "member-2" only) for the scenario
//   firstServerChange               - request sent first; it is never answered by the mock leader
//   firstForwardedServerChangeClass - message class expected at the mock leader for the first request
//   secondServerChange              - request sent while the first is still unanswered
// The sender of the second request must receive a Failure within 5 seconds.
// NOTE(review): this is a parameterized helper named and exposed like a test method; whether it carries a
// test annotation is not visible here - confirm it is not picked up by the runner.
1875 final TestKit kit = new TestKit(getSystem());
1876 final TestKit mockShardLeaderKit = new TestKit(getSystem());
1877 final TestKit secondRequestKit = new TestKit(getSystem());
1879 MockConfiguration mockConfig = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
1880 .put(shardName, Arrays.asList("member-2")).build());
1882 final TestActorRef<TestShardManager> shardManager = TestActorRef.create(getSystem(),
1883 newTestShardMgrBuilder().configuration(mockConfig).shardActor(mockShardActor)
1884 .cluster(new MockClusterWrapper()).props()
1885 .withDispatcher(Dispatchers.DefaultDispatcherId()),
// With this interceptor installed, the forwarded server-change message arrives at mockShardLeaderKit.
1888 shardManager.underlyingActor().setMessageInterceptor(newFindPrimaryInterceptor(mockShardLeaderKit.getRef()));
1890 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1892 shardManager.tell(firstServerChange, kit.getRef());
// Wait until the first request has reached the leader; no reply is sent, so it stays outstanding.
1894 mockShardLeaderKit.expectMsgClass(firstForwardedServerChangeClass);
// The second request uses its own kit so its reply cannot be confused with one for the first request.
1896 shardManager.tell(secondServerChange, secondRequestKit.getRef());
1898 secondRequestKit.expectMsgClass(Duration.ofSeconds(5), Failure.class);
1902 public void testServerRemovedShardActorNotRunning() {
// Verifies that a ServerRemoved message for member-1's "default" shard, sent while the local shards are
// still reported as not initialized, leads to a persisted snapshot that lists only "people".
1903 LOG.info("testServerRemovedShardActorNotRunning starting");
1904 final TestKit kit = new TestKit(getSystem());
// member-1 is configured for "default" and "people"; "astronauts" is on member-2 only.
1905 MockConfiguration mockConfig = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
1906 .put("default", Arrays.asList("member-1", "member-2"))
1907 .put("astronauts", Arrays.asList("member-2"))
1908 .put("people", Arrays.asList("member-1", "member-2")).build());
1910 TestActorRef<TestShardManager> shardManager = actorFactory.createTestActor(
1911 newShardMgrProps(mockConfig).withDispatcher(Dispatchers.DefaultDispatcherId()));
1913 shardManager.underlyingActor().waitForRecoveryComplete();
// No UpdateSchemaContext is sent in this test; both lookups are expected to be answered with
// NotInitializedException.
1914 shardManager.tell(new FindLocalShard("people", false), kit.getRef());
1915 kit.expectMsgClass(Duration.ofSeconds(5), NotInitializedException.class);
1917 shardManager.tell(new FindLocalShard("default", false), kit.getRef());
1918 kit.expectMsgClass(Duration.ofSeconds(5), NotInitializedException.class);
1920 // Removed the default shard replica from member-1
1921 ShardIdentifier.Builder builder = new ShardIdentifier.Builder();
1922 ShardIdentifier shardId = builder.shardName("default").memberName(MEMBER_1).type(shardMrgIDSuffix)
1924 shardManager.tell(new ServerRemoved(shardId.toString()), kit.getRef());
// Of member-1's two configured shards only "people" should remain in the persisted shard list.
1926 shardManager.underlyingActor().verifySnapshotPersisted(Sets.newHashSet("people"));
1928 LOG.info("testServerRemovedShardActorNotRunning ending");
1932 public void testServerRemovedShardActorRunning() {
// Verifies that a ServerRemoved message for member-1's "default" shard, sent after the shards have been
// initialized, leads to a persisted snapshot listing only "people" and to a Shutdown message being
// delivered to the "default" shard actor.
1933 LOG.info("testServerRemovedShardActorRunning starting");
1934 final TestKit kit = new TestKit(getSystem());
// member-1 is configured for "default" and "people"; "astronauts" is on member-2 only.
1935 MockConfiguration mockConfig = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
1936 .put("default", Arrays.asList("member-1", "member-2"))
1937 .put("astronauts", Arrays.asList("member-2"))
1938 .put("people", Arrays.asList("member-1", "member-2")).build());
// A MessageCollectorActor stands in for the "default" shard so the Shutdown can be observed later.
1940 String shardId = ShardIdentifier.create("default", MEMBER_1, shardMrgIDSuffix).toString();
1941 ActorRef shard = actorFactory.createActor(MessageCollectorActor.props(), shardId);
1943 TestActorRef<TestShardManager> shardManager = actorFactory
1944 .createTestActor(newTestShardMgrBuilder(mockConfig).addShardActor("default", shard).props()
1945 .withDispatcher(Dispatchers.DefaultDispatcherId()));
1947 shardManager.underlyingActor().waitForRecoveryComplete();
1949 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
1950 shardManager.tell(new ActorInitialized(), shard);
// Both of member-1's shards must be initialized before the removal is signalled.
1952 waitForShardInitialized(shardManager, "people", kit);
1953 waitForShardInitialized(shardManager, "default", kit);
1955 // Removed the default shard replica from member-1
1956 shardManager.tell(new ServerRemoved(shardId), kit.getRef());
1958 shardManager.underlyingActor().verifySnapshotPersisted(Sets.newHashSet("people"));
// The running shard actor is expected to be told to shut down.
1960 MessageCollectorActor.expectFirstMatching(shard, Shutdown.class);
1962 LOG.info("testServerRemovedShardActorRunning ending");
1966 public void testShardPersistenceWithRestoredData() {
// Verifies that a shard manager started with a pre-seeded ShardManagerSnapshot follows the snapshot's shard
// list rather than the configuration: "people" (configured for member-1 but absent from the snapshot) is
// reported as LocalShardNotFound, while "default" and "astronauts" (both in the snapshot) are answered with
// NotInitializedException.
1967 LOG.info("testShardPersistenceWithRestoredData starting");
1968 final TestKit kit = new TestKit(getSystem());
1969 MockConfiguration mockConfig =
1970 new MockConfiguration(ImmutableMap.<String, List<String>>builder()
1971 .put("default", Arrays.asList("member-1", "member-2"))
1972 .put("astronauts", Arrays.asList("member-2"))
1973 .put("people", Arrays.asList("member-1", "member-2")).build());
// Seed the in-memory snapshot store. NOTE(review): the key "shard-manager-" + shardMrgIDSuffix is presumably
// the persistence id the shard manager recovers from - confirm.
1974 String[] restoredShards = {"default", "astronauts"};
1975 ShardManagerSnapshot snapshot =
1976 new ShardManagerSnapshot(Arrays.asList(restoredShards));
1977 InMemorySnapshotStore.addSnapshot("shard-manager-" + shardMrgIDSuffix, snapshot);
1979 // create shardManager to come up with restored data
1980 TestActorRef<TestShardManager> newRestoredShardManager = actorFactory.createTestActor(
1981 newShardMgrProps(mockConfig).withDispatcher(Dispatchers.DefaultDispatcherId()));
1983 newRestoredShardManager.underlyingActor().waitForRecoveryComplete();
// "people" is not in the restored shard list, so no local shard is expected for it.
1985 newRestoredShardManager.tell(new FindLocalShard("people", false), kit.getRef());
1986 LocalShardNotFound notFound = kit.expectMsgClass(Duration.ofSeconds(5), LocalShardNotFound.class);
1987 assertEquals("for uninitialized shard", "people", notFound.getShardName());
1989 // Verify a local shard is created for the restored shards,
1990 // although we expect a NotInitializedException for the shards
1991 // as the actor initialization
1992 // message is not sent for them
1993 newRestoredShardManager.tell(new FindLocalShard("default", false), kit.getRef());
1994 kit.expectMsgClass(Duration.ofSeconds(5), NotInitializedException.class);
1996 newRestoredShardManager.tell(new FindLocalShard("astronauts", false), kit.getRef());
1997 kit.expectMsgClass(Duration.ofSeconds(5), NotInitializedException.class);
1999 LOG.info("testShardPersistenceWithRestoredData ending");
2003 public void testShutDown() throws Exception {
// Verifies graceful shutdown: a Shutdown sent to the shard manager must reach both shard actors, the shard
// manager must still be running 500 ms later while the shards are alive, and it must stop once both shard
// actors have been killed.
2004 LOG.info("testShutDown starting");
2005 final TestKit kit = new TestKit(getSystem());
2006 MockConfiguration mockConfig = new MockConfiguration(ImmutableMap.<String, List<String>>builder()
2007 .put("shard1", Arrays.asList("member-1")).put("shard2", Arrays.asList("member-1")).build());
// MessageCollectorActors stand in for the two shards so the forwarded Shutdown can be observed.
2009 String shardId1 = ShardIdentifier.create("shard1", MEMBER_1, shardMrgIDSuffix).toString();
2010 ActorRef shard1 = actorFactory.createActor(MessageCollectorActor.props(), shardId1);
2012 String shardId2 = ShardIdentifier.create("shard2", MEMBER_1, shardMrgIDSuffix).toString();
2013 ActorRef shard2 = actorFactory.createActor(MessageCollectorActor.props(), shardId2);
2015 ActorRef shardManager = actorFactory.createActor(newTestShardMgrBuilder(mockConfig)
2016 .addShardActor("shard1", shard1).addShardActor("shard2", shard2).props());
2018 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
2019 shardManager.tell(new ActorInitialized(), shard1);
2020 shardManager.tell(new ActorInitialized(), shard2);
// gracefulStop sends Shutdown.INSTANCE and returns a future for the actor's termination, bounded by 5 s.
2022 FiniteDuration duration = FiniteDuration.create(5, TimeUnit.SECONDS);
2023 Future<Boolean> stopFuture = Patterns.gracefulStop(shardManager, duration, Shutdown.INSTANCE);
2025 MessageCollectorActor.expectFirstMatching(shard1, Shutdown.class);
2026 MessageCollectorActor.expectFirstMatching(shard2, Shutdown.class);
// The collector actors are still alive, so this 500 ms wait is expected to time out; reaching fail() would
// mean the shard manager stopped without waiting for its shards.
2029 Await.ready(stopFuture, FiniteDuration.create(500, TimeUnit.MILLISECONDS));
2030 fail("ShardManager actor stopped without waiting for the Shards to be stopped");
2031 } catch (TimeoutException e) {
// Once both shard actors are killed the stop future is expected to complete with TRUE.
2035 actorFactory.killActor(shard1, kit);
2036 actorFactory.killActor(shard2, kit);
2038 Boolean stopped = Await.result(stopFuture, duration);
2039 assertEquals("Stopped", Boolean.TRUE, stopped);
2041 LOG.info("testShutDown ending");
2045 public void testChangeServersVotingStatus() {
// Verifies that ChangeShardMembersVotingStatus for the default shard is forwarded to the local shard actor
// as a ChangeServersVotingStatus keyed by member-2's shard id, and that the requester receives a Success
// when the shard answers with ServerChangeReply(OK).
2046 final TestKit kit = new TestKit(getSystem());
2047 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
// Stand-in for the local shard: constructed with ChangeServersVotingStatus.class and a canned OK reply.
2049 ActorRef respondActor = actorFactory
2050 .createActor(Props.create(MockRespondActor.class, ChangeServersVotingStatus.class,
2051 new ServerChangeReply(ServerChangeStatus.OK, null)), memberId);
// NOTE(review): this shard manager is created with getSystem().actorOf(...) whereas other tests in this
// class use actorFactory - confirm the actor is stopped at teardown.
2053 ActorRef shardManager = getSystem().actorOf(newPropsShardMgrWithMockShardActor(respondActor));
2055 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
2056 shardManager.tell(new ActorInitialized(), respondActor);
// Leader state names the local member id in both id arguments, followed by a Candidate -> Leader role change.
2057 shardManager.tell(new ShardLeaderStateChanged(memberId, memberId, mock(DataTree.class),
2058 DataStoreVersions.CURRENT_VERSION), kit.getRef());
2060 new RoleChangeNotification(memberId, RaftState.Candidate.name(), RaftState.Leader.name()),
// The request is keyed by member name ("member-2"); the forwarded message is checked below against a map
// keyed by the full shard identifier.
2064 new ChangeShardMembersVotingStatus("default", ImmutableMap.of("member-2", Boolean.TRUE)), kit.getRef());
2066 ChangeServersVotingStatus actualChangeStatusMsg = MessageCollectorActor
2067 .expectFirstMatching(respondActor, ChangeServersVotingStatus.class);
// NOTE(review): JUnit's assertEquals(message, expected, actual) takes the expected value first; here the
// received map is passed in the expected position, so a failure message would label the values the wrong
// way round - consider swapping the two arguments.
2068 assertEquals("ChangeServersVotingStatus map", actualChangeStatusMsg.getServerVotingStatusMap(),
2069 ImmutableMap.of(ShardIdentifier
2070 .create("default", MemberName.forName("member-2"), shardMrgIDSuffix).toString(),
2073 kit.expectMsgClass(Duration.ofSeconds(5), Success.class);
2077 public void testChangeServersVotingStatusWithNoLeader() {
// Verifies that ChangeShardMembersVotingStatus is answered with a Status.Failure caused by a
// NoShardLeaderException when the local shard replies to ChangeServersVotingStatus with NO_LEADER.
2078 final TestKit kit = new TestKit(getSystem());
2079 String memberId = "member-1-shard-default-" + shardMrgIDSuffix;
// Stand-in for the local shard: constructed with ChangeServersVotingStatus.class and a canned NO_LEADER reply.
2081 ActorRef respondActor = actorFactory
2082 .createActor(Props.create(MockRespondActor.class, ChangeServersVotingStatus.class,
2083 new ServerChangeReply(ServerChangeStatus.NO_LEADER, null)), memberId);
// NOTE(review): this shard manager is created with getSystem().actorOf(...) whereas other tests in this
// class use actorFactory - confirm the actor is stopped at teardown.
2085 ActorRef shardManager = getSystem().actorOf(newPropsShardMgrWithMockShardActor(respondActor));
2087 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
2088 shardManager.tell(new ActorInitialized(), respondActor);
// The local shard is reported as Follower with a null previous role; no ShardLeaderStateChanged is sent in
// the visible code of this test.
2089 shardManager.tell(new RoleChangeNotification(memberId, null, RaftState.Follower.name()), respondActor);
2092 new ChangeShardMembersVotingStatus("default", ImmutableMap.of("member-2", Boolean.TRUE)), kit.getRef());
// The request must still have been forwarded to the shard actor.
2094 MessageCollectorActor.expectFirstMatching(respondActor, ChangeServersVotingStatus.class);
2096 Status.Failure resp = kit.expectMsgClass(Duration.ofSeconds(5), Status.Failure.class);
// NOTE(review): the assertion message below contains the typo "resposnse" (should read "response"); it is a
// runtime string and is left unchanged here.
2097 assertTrue("Failure resposnse", resp.cause() instanceof NoShardLeaderException);
2100 @SuppressWarnings("unchecked")
2102 public void testRegisterForShardLeaderChanges() {
2103 LOG.info("testRegisterForShardLeaderChanges starting");
2105 final String memberId1 = "member-1-shard-default-" + shardMrgIDSuffix;
2106 final String memberId2 = "member-2-shard-default-" + shardMrgIDSuffix;
2107 final TestKit kit = new TestKit(getSystem());
2108 final ActorRef shardManager = actorFactory.createActor(newPropsShardMgrWithMockShardActor());
2110 shardManager.tell(new UpdateSchemaContext(TEST_SCHEMA_CONTEXT), kit.getRef());
2111 shardManager.tell(new ActorInitialized(), mockShardActor);
2113 final Consumer<String> mockCallback = mock(Consumer.class);
2114 shardManager.tell(new RegisterForShardAvailabilityChanges(mockCallback), kit.getRef());
2116 final Success reply = kit.expectMsgClass(Duration.ofSeconds(5), Success.class);
2117 final Registration reg = (Registration) reply.status();
2119 final DataTree mockDataTree = mock(DataTree.class);
2120 shardManager.tell(new ShardLeaderStateChanged(memberId1, memberId1, mockDataTree,
2121 DataStoreVersions.CURRENT_VERSION), mockShardActor);
2123 verify(mockCallback, timeout(5000)).accept("default");
2125 reset(mockCallback);
2126 shardManager.tell(new ShardLeaderStateChanged(memberId1, memberId1, mockDataTree,
2127 DataStoreVersions.CURRENT_VERSION), mockShardActor);
2129 Uninterruptibles.sleepUninterruptibly(500, TimeUnit.MILLISECONDS);
2130 verifyNoMoreInteractions(mockCallback);
2132 shardManager.tell(new ShardLeaderStateChanged(memberId1, null, mockDataTree,
2133 DataStoreVersions.CURRENT_VERSION), mockShardActor);
2135 verify(mockCallback, timeout(5000)).accept("default");
2137 reset(mockCallback);
2138 shardManager.tell(new ShardLeaderStateChanged(memberId1, memberId2, mockDataTree,
2139 DataStoreVersions.CURRENT_VERSION), mockShardActor);
2141 verify(mockCallback, timeout(5000)).accept("default");
2143 reset(mockCallback);
2146 shardManager.tell(new ShardLeaderStateChanged(memberId1, memberId1, mockDataTree,
2147 DataStoreVersions.CURRENT_VERSION), mockShardActor);
2149 Uninterruptibles.sleepUninterruptibly(500, TimeUnit.MILLISECONDS);
2150 verifyNoMoreInteractions(mockCallback);
2152 LOG.info("testRegisterForShardLeaderChanges ending");
2155 public static class TestShardManager extends ShardManager {
2156 private final CountDownLatch recoveryComplete = new CountDownLatch(1);
2157 private final CountDownLatch snapshotPersist = new CountDownLatch(1);
2158 private ShardManagerSnapshot snapshot;
2159 private final Map<String, ActorRef> shardActors;
2160 private final ActorRef shardActor;
2161 private CountDownLatch findPrimaryMessageReceived = new CountDownLatch(1);
2162 private CountDownLatch memberUpReceived = new CountDownLatch(1);
2163 private CountDownLatch memberRemovedReceived = new CountDownLatch(1);
2164 private CountDownLatch memberUnreachableReceived = new CountDownLatch(1);
2165 private CountDownLatch memberReachableReceived = new CountDownLatch(1);
2166 private volatile MessageInterceptor messageInterceptor;
2168 TestShardManager(final Builder builder) {
2170 shardActor = builder.shardActor;
2171 shardActors = builder.shardActors;
2175 protected void handleRecover(final Object message) throws Exception {
2177 super.handleRecover(message);
2179 if (message instanceof RecoveryCompleted) {
2180 recoveryComplete.countDown();
2185 private void countDownIfOther(final Member member, final CountDownLatch latch) {
2186 if (!getCluster().getCurrentMemberName().equals(memberToName(member))) {
2192 public void handleCommand(final Object message) throws Exception {
2194 if (messageInterceptor != null && messageInterceptor.canIntercept(message)) {
2195 getSender().tell(messageInterceptor.apply(message), getSelf());
2197 super.handleCommand(message);
2200 if (message instanceof FindPrimary) {
2201 findPrimaryMessageReceived.countDown();
2202 } else if (message instanceof ClusterEvent.MemberUp) {
2203 countDownIfOther(((ClusterEvent.MemberUp) message).member(), memberUpReceived);
2204 } else if (message instanceof ClusterEvent.MemberRemoved) {
2205 countDownIfOther(((ClusterEvent.MemberRemoved) message).member(), memberRemovedReceived);
2206 } else if (message instanceof ClusterEvent.UnreachableMember) {
2207 countDownIfOther(((ClusterEvent.UnreachableMember) message).member(), memberUnreachableReceived);
2208 } else if (message instanceof ClusterEvent.ReachableMember) {
2209 countDownIfOther(((ClusterEvent.ReachableMember) message).member(), memberReachableReceived);
2214 void setMessageInterceptor(final MessageInterceptor messageInterceptor) {
2215 this.messageInterceptor = messageInterceptor;
2218 void waitForRecoveryComplete() {
2219 assertTrue("Recovery complete",
2220 Uninterruptibles.awaitUninterruptibly(recoveryComplete, 5, TimeUnit.SECONDS));
2223 public void waitForMemberUp() {
2224 assertTrue("MemberUp received",
2225 Uninterruptibles.awaitUninterruptibly(memberUpReceived, 5, TimeUnit.SECONDS));
2226 memberUpReceived = new CountDownLatch(1);
2229 void waitForMemberRemoved() {
2230 assertTrue("MemberRemoved received",
2231 Uninterruptibles.awaitUninterruptibly(memberRemovedReceived, 5, TimeUnit.SECONDS));
2232 memberRemovedReceived = new CountDownLatch(1);
2235 void waitForUnreachableMember() {
2236 assertTrue("UnreachableMember received",
2237 Uninterruptibles.awaitUninterruptibly(memberUnreachableReceived, 5, TimeUnit.SECONDS));
2238 memberUnreachableReceived = new CountDownLatch(1);
2241 void waitForReachableMember() {
2242 assertTrue("ReachableMember received",
2243 Uninterruptibles.awaitUninterruptibly(memberReachableReceived, 5, TimeUnit.SECONDS));
2244 memberReachableReceived = new CountDownLatch(1);
2247 void verifyFindPrimary() {
2248 assertTrue("FindPrimary received",
2249 Uninterruptibles.awaitUninterruptibly(findPrimaryMessageReceived, 5, TimeUnit.SECONDS));
2250 findPrimaryMessageReceived = new CountDownLatch(1);
2253 public static Builder builder(final DatastoreContext.Builder datastoreContextBuilder) {
2254 return new Builder(datastoreContextBuilder);
2257 public static class Builder extends AbstractGenericCreator<Builder, TestShardManager> {
2258 private ActorRef shardActor;
2259 private final Map<String, ActorRef> shardActors = new HashMap<>();
2261 Builder(final DatastoreContext.Builder datastoreContextBuilder) {
2262 super(TestShardManager.class);
2263 datastoreContextFactory(newDatastoreContextFactory(datastoreContextBuilder.build()));
2266 Builder shardActor(final ActorRef newShardActor) {
2267 shardActor = newShardActor;
2271 Builder addShardActor(final String shardName, final ActorRef actorRef) {
2272 shardActors.put(shardName, actorRef);
2278 public void saveSnapshot(final Object obj) {
2279 snapshot = (ShardManagerSnapshot) obj;
2280 snapshotPersist.countDown();
2281 super.saveSnapshot(obj);
2284 void verifySnapshotPersisted(final Set<String> shardList) {
2285 assertTrue("saveSnapshot invoked",
2286 Uninterruptibles.awaitUninterruptibly(snapshotPersist, 5, TimeUnit.SECONDS));
2287 assertEquals("Shard Persisted", shardList, Sets.newHashSet(snapshot.getShardList()));
2291 protected ActorRef newShardActor(final ShardInformation info) {
2292 if (shardActors.get(info.getShardName()) != null) {
2293 return shardActors.get(info.getShardName());
2296 if (shardActor != null) {
2300 return super.newShardActor(info);
/**
 * Base creator that produces {@code Props} for an arbitrary ShardManager subclass.
 *
 * @param <T> the concrete creator type, passed through to AbstractShardManagerCreator
 * @param <C> the ShardManager subclass to instantiate
 */
2304 private abstract static class AbstractGenericCreator<T extends AbstractGenericCreator<T, ?>, C extends ShardManager>
2305 extends AbstractShardManagerCreator<T> {
// Class handed to Props.create() in props().
2306 private final Class<C> shardManagerClass;
// Stores the target class and pre-populates the creator with a MockClusterWrapper, a MockConfiguration,
// the enclosing test's `ready` readiness future and a fresh PrimaryShardInfoFutureCache.
2308 AbstractGenericCreator(final Class<C> shardManagerClass) {
2309 this.shardManagerClass = shardManagerClass;
2310 cluster(new MockClusterWrapper()).configuration(new MockConfiguration()).readinessFuture(ready)
2311 .primaryShardInfoCache(new PrimaryShardInfoFutureCache());
// Builds Props that construct shardManagerClass with this creator as the constructor argument.
2315 public Props props() {
2317 return Props.create(shardManagerClass, this);
2321 private static class GenericCreator<C extends ShardManager> extends AbstractGenericCreator<GenericCreator<C>, C> {
2322 GenericCreator(final Class<C> shardManagerClass) {
2323 super(shardManagerClass);
2327 private static class DelegatingShardManagerCreator implements Creator<ShardManager> {
2328 private static final long serialVersionUID = 1L;
2329 private final Creator<ShardManager> delegate;
2331 DelegatingShardManagerCreator(final Creator<ShardManager> delegate) {
2332 this.delegate = delegate;
2336 public ShardManager create() throws Exception {
2337 return delegate.create();
/**
 * Hook for replacing the handling of selected messages: {@link #canIntercept} decides whether a
 * message is taken over, and {@code apply} maps an intercepted message to the reply to send.
 */
interface MessageInterceptor extends Function<Object, Object> {
    /** Returns {@code true} when this interceptor wants to handle {@code message}. */
    boolean canIntercept(Object message);
}
2345 private static MessageInterceptor newFindPrimaryInterceptor(final ActorRef primaryActor) {
2346 return new MessageInterceptor() {
2348 public Object apply(final Object message) {
2349 return new RemotePrimaryShardFound(Serialization.serializedActorPath(primaryActor), (short) 1);
2353 public boolean canIntercept(final Object message) {
2354 return message instanceof FindPrimary;
2359 private static class MockRespondActor extends MessageCollectorActor {
2360 static final String CLEAR_RESPONSE = "clear-response";
2362 private Object responseMsg;
2363 private final Class<?> requestClass;
2365 @SuppressWarnings("unused")
2366 MockRespondActor(final Class<?> requestClass, final Object responseMsg) {
2367 this.requestClass = requestClass;
2368 this.responseMsg = responseMsg;
2372 public void onReceive(final Object message) throws Exception {
2373 if (message.equals(CLEAR_RESPONSE)) {
2376 super.onReceive(message);
2377 if (message.getClass().equals(requestClass) && responseMsg != null) {
2378 getSender().tell(responseMsg, getSelf());