*/
int getSnapshotDataThresholdPercentage();
+
+ /**
+ * Returns the interval (in seconds) after which a snapshot should be taken during recovery.
+ * Zero means don't take snapshots (the corresponding setter rejects negative values).
+ *
+ * @return the interval of recovery snapshot in seconds
+ */
+ int getRecoverySnapshotIntervalSeconds();
+
/**
* Returns the interval at which a heart beat message should be sent to remote followers.
*
private static final Logger LOG = LoggerFactory.getLogger(DefaultConfigParamsImpl.class);
private static final int SNAPSHOT_BATCH_COUNT = 20000;
+ /**
+ * Interval after which a snapshot should be taken during the recovery process. 0 means never.
+ */
+ private static final int RECOVERY_SNAPSHOT_INTERVAL_SECONDS = 0;
private static final int JOURNAL_RECOVERY_LOG_BATCH_SIZE = 1000;
private FiniteDuration heartBeatInterval = HEART_BEAT_INTERVAL;
private long snapshotBatchCount = SNAPSHOT_BATCH_COUNT;
private int journalRecoveryLogBatchSize = JOURNAL_RECOVERY_LOG_BATCH_SIZE;
+ private int recoverySnapshotIntervalSeconds = RECOVERY_SNAPSHOT_INTERVAL_SECONDS;
private long isolatedLeaderCheckInterval = HEART_BEAT_INTERVAL.$times(1000).toMillis();
private FiniteDuration electionTimeOutInterval;
this.snapshotBatchCount = snapshotBatchCount;
}
+ /**
+ * Sets the interval in seconds after which a snapshot should be taken during recovery.
+ *
+ * @param recoverySnapshotInterval the interval in seconds; 0 means never take recovery snapshots
+ * @throws IllegalArgumentException if the interval is negative
+ */
+ public void setRecoverySnapshotIntervalSeconds(final int recoverySnapshotInterval) {
+ checkArgument(recoverySnapshotInterval >= 0);
+ this.recoverySnapshotIntervalSeconds = recoverySnapshotInterval;
+ }
+
public void setSnapshotDataThresholdPercentage(final int snapshotDataThresholdPercentage) {
this.snapshotDataThresholdPercentage = snapshotDataThresholdPercentage;
}
return snapshotDataThresholdPercentage;
}
+ @Override
+ public int getRecoverySnapshotIntervalSeconds() {
+ // No "this." qualifier - consistent with the other getters in this class.
+ return recoverySnapshotIntervalSeconds;
+ }
+
@Override
public FiniteDuration getHeartBeatInterval() {
return heartBeatInterval;
import akka.persistence.SnapshotOffer;
import com.google.common.base.Stopwatch;
import java.util.Collections;
+import java.util.concurrent.TimeUnit;
import org.opendaylight.controller.cluster.PersistentDataProvider;
import org.opendaylight.controller.cluster.raft.base.messages.ApplySnapshot;
import org.opendaylight.controller.cluster.raft.persisted.ApplyJournalEntries;
private boolean hasMigratedDataRecovered;
private Stopwatch recoveryTimer;
+ private Stopwatch recoverySnapshotTimer;
private final Logger log;
RaftActorRecoverySupport(final RaftActorContext context, final RaftActorRecoveryCohort cohort) {
return context.getReplicatedLog();
}
- private void initRecoveryTimer() {
+ private void initRecoveryTimers() {
+ // Lazily start the overall recovery stopwatch and, when a positive recovery snapshot
+ // interval is configured, the stopwatch that paces snapshots taken during recovery.
if (recoveryTimer == null) {
recoveryTimer = Stopwatch.createStarted();
}
+ if (recoverySnapshotTimer == null && context.getConfigParams().getRecoverySnapshotIntervalSeconds() > 0) {
+ recoverySnapshotTimer = Stopwatch.createStarted();
+ }
}
private void onRecoveredSnapshot(final SnapshotOffer offer) {
log.debug("{}: SnapshotOffer called.", context.getId());
- initRecoveryTimer();
+ initRecoveryTimers();
Snapshot snapshot = (Snapshot) offer.snapshot();
if (logEntry != null) {
lastApplied++;
batchRecoveredLogEntry(logEntry);
+ if (shouldTakeRecoverySnapshot() && !context.getSnapshotManager().isCapturing()) {
+ if (currentRecoveryBatchCount > 0) {
+ endCurrentLogRecoveryBatch();
+ }
+ context.setLastApplied(lastApplied);
+ context.setCommitIndex(lastApplied);
+ takeRecoverySnapshot(logEntry);
+ }
} else {
// Shouldn't happen but cover it anyway.
log.error("{}: Log entry not found for index {}", context.getId(), i);
}
private void batchRecoveredLogEntry(final ReplicatedLogEntry logEntry) {
- initRecoveryTimer();
+ initRecoveryTimers();
int batchSize = context.getConfigParams().getJournalRecoveryLogBatchSize();
if (!isServerConfigurationPayload(logEntry)) {
}
}
+ /**
+ * Attempts to capture a snapshot for the given recovered log entry. On success the recovery
+ * snapshot timer is reset; otherwise the capture is retried on the next recovered entry.
+ */
+ private void takeRecoverySnapshot(final ReplicatedLogEntry logEntry) {
+ // Prefix log messages with the actor id, consistent with the rest of this class.
+ log.info("{}: Time for recovery snapshot on entry with index {}", context.getId(), logEntry.getIndex());
+ final SnapshotManager snapshotManager = context.getSnapshotManager();
+ if (snapshotManager.capture(logEntry, -1)) {
+ log.info("{}: Capturing snapshot, resetting timer for the next recovery snapshot interval.",
+ context.getId());
+ recoverySnapshotTimer.reset().start();
+ } else {
+ log.info("{}: SnapshotManager is not able to capture snapshot at this time. It will be retried "
+ + "again with the next recovered entry.", context.getId());
+ }
+ }
+
+ // True when recovery snapshotting is enabled (timer was started in initRecoveryTimers) and
+ // the configured interval has elapsed since the last recovery snapshot / recovery start.
+ private boolean shouldTakeRecoverySnapshot() {
+ return this.recoverySnapshotTimer != null && this.recoverySnapshotTimer.elapsed(TimeUnit.SECONDS)
+ >= context.getConfigParams().getRecoverySnapshotIntervalSeconds();
+ }
+
private void endCurrentLogRecoveryBatch() {
cohort.applyCurrentLogRecoveryBatch();
currentRecoveryBatchCount = 0;
recoveryTime = "";
}
+ if (recoverySnapshotTimer != null) {
+ recoverySnapshotTimer.stop();
+ recoverySnapshotTimer = null;
+ }
+
log.info("{}: Recovery completed {} - Switching actor to Follower - last log index = {}, last log term = {}, "
+ "snapshot index = {}, snapshot term = {}, journal size = {}", context.getId(), recoveryTime,
replicatedLog().lastIndex(), replicatedLog().lastTerm(), replicatedLog().getSnapshotIndex(),
import static org.mockito.ArgumentMatchers.anyInt;
import static org.mockito.Mockito.doNothing;
import static org.mockito.Mockito.doReturn;
+import static org.mockito.Mockito.mock;
import static org.mockito.Mockito.never;
+import static org.mockito.Mockito.times;
import static org.mockito.Mockito.verify;
import static org.mockito.Mockito.verifyNoMoreInteractions;
+import akka.actor.ActorRef;
+import akka.actor.ActorSystem;
+import akka.actor.Props;
import akka.persistence.RecoveryCompleted;
import akka.persistence.SnapshotMetadata;
import akka.persistence.SnapshotOffer;
import com.google.common.collect.Sets;
import com.google.common.util.concurrent.MoreExecutors;
+import java.io.OutputStream;
import java.util.Arrays;
import java.util.Collections;
+import java.util.Optional;
+import java.util.concurrent.ExecutionException;
+import java.util.concurrent.Executors;
+import java.util.concurrent.ScheduledExecutorService;
+import java.util.concurrent.ScheduledFuture;
+import java.util.concurrent.TimeUnit;
+import java.util.concurrent.atomic.AtomicInteger;
+import java.util.function.Consumer;
+import org.junit.Assert;
import org.junit.Before;
import org.junit.Test;
import org.mockito.ArgumentMatchers;
import org.opendaylight.controller.cluster.raft.persisted.Snapshot;
import org.opendaylight.controller.cluster.raft.persisted.UpdateElectionTerm;
import org.opendaylight.controller.cluster.raft.protobuff.client.messages.Payload;
+import org.opendaylight.controller.cluster.raft.utils.DoNothingActor;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
@Mock
private DataPersistenceProvider mockPersistence;
-
@Mock
private RaftActorRecoveryCohort mockCohort;
- @Mock
- private RaftActorSnapshotCohort mockSnapshotCohort;
-
@Mock
PersistentDataProvider mockPersistentProvider;
+ ActorRef mockActorRef;
+
+ ActorSystem mockActorSystem;
+
private RaftActorRecoverySupport support;
private RaftActorContext context;
private final DefaultConfigParamsImpl configParams = new DefaultConfigParamsImpl();
private final String localId = "leader";
-
@Before
public void setup() {
MockitoAnnotations.initMocks(this);
-
- context = new RaftActorContextImpl(null, null, localId, new ElectionTermImpl(mockPersistentProvider, "test",
- LOG), -1, -1, Collections.<String,String>emptyMap(), configParams,
- mockPersistence, applyState -> { }, LOG, MoreExecutors.directExecutor());
+ mockActorSystem = ActorSystem.create();
+ mockActorRef = mockActorSystem.actorOf(Props.create(DoNothingActor.class));
+ context = new RaftActorContextImpl(mockActorRef, null, localId,
+ new ElectionTermImpl(mockPersistentProvider, "test", LOG), -1, -1,
+ Collections.<String, String>emptyMap(), configParams, mockPersistence, applyState -> {
+ }, LOG, MoreExecutors.directExecutor());
support = new RaftActorRecoverySupport(context, mockCohort);
inOrder.verifyNoMoreInteractions();
}
+ @Test
+ public void testIncrementalRecovery() {
+ int recoverySnapshotInterval = 3;
+ int numberOfEntries = 5;
+ configParams.setRecoverySnapshotIntervalSeconds(recoverySnapshotInterval);
+ @SuppressWarnings("unchecked")
+ Consumer<Optional<OutputStream>> mockSnapshotConsumer = mock(Consumer.class);
+ context.getSnapshotManager().setCreateSnapshotConsumer(mockSnapshotConsumer);
+
+ ScheduledExecutorService applyEntriesExecutor = Executors.newSingleThreadScheduledExecutor();
+ ReplicatedLog replicatedLog = context.getReplicatedLog();
+
+ for (int i = 0; i <= numberOfEntries; i++) {
+ replicatedLog.append(new SimpleReplicatedLogEntry(i, 1,
+ new MockRaftActorContext.MockPayload(String.valueOf(i))));
+ }
+
+ // Apply one journal entry per second; the 3-second recovery snapshot interval should
+ // trigger exactly one snapshot capture over the 5-second run.
+ AtomicInteger entryCount = new AtomicInteger();
+ ScheduledFuture<?> applyEntriesFuture = applyEntriesExecutor.scheduleAtFixedRate(() -> {
+ int run = entryCount.getAndIncrement();
+ LOG.info("Sending entry number {}", run);
+ sendMessageToSupport(new ApplyJournalEntries(run));
+ }, 0, 1, TimeUnit.SECONDS);
+
+ ScheduledFuture<Boolean> canceller = applyEntriesExecutor.schedule(() -> applyEntriesFuture.cancel(false),
+ numberOfEntries, TimeUnit.SECONDS);
+ try {
+ canceller.get();
+ verify(mockSnapshotConsumer, times(1)).accept(any());
+ } catch (InterruptedException | ExecutionException e) {
+ // Preserve the failure cause instead of a bare fail().
+ Assert.fail(e.getMessage());
+ } finally {
+ // Always release the executor thread, even when verification throws.
+ applyEntriesExecutor.shutdownNow();
+ }
+ }
+
@Test
public void testOnSnapshotOffer() {
lastAppliedDuringSnapshotCapture, 1, electionTerm, electionVotedFor, null);
SnapshotMetadata metadata = new SnapshotMetadata("test", 6, 12345);
- SnapshotOffer snapshotOffer = new SnapshotOffer(metadata , snapshot);
+ SnapshotOffer snapshotOffer = new SnapshotOffer(metadata, snapshot);
sendMessageToSupport(snapshotOffer);
}
static UpdateElectionTerm updateElectionTerm(final long term, final String votedFor) {
- return ArgumentMatchers.argThat(
- other -> term == other.getCurrentTerm() && votedFor.equals(other.getVotedFor()));
+ return ArgumentMatchers.argThat(other ->
+ term == other.getCurrentTerm() && votedFor.equals(other.getVotedFor()));
}
@Test
long electionTerm = 2;
String electionVotedFor = "member-2";
ServerConfigurationPayload serverPayload = new ServerConfigurationPayload(Arrays.asList(
- new ServerInfo(localId, true),
- new ServerInfo("follower1", true),
- new ServerInfo("follower2", true)));
+ new ServerInfo(localId, true),
+ new ServerInfo("follower1", true),
+ new ServerInfo("follower2", true)));
MockSnapshotState snapshotState = new MockSnapshotState(Arrays.asList(new MockPayload("1")));
Snapshot snapshot = Snapshot.create(snapshotState, Collections.<ReplicatedLogEntry>emptyList(),
-1, -1, -1, -1, electionTerm, electionVotedFor, serverPayload);
SnapshotMetadata metadata = new SnapshotMetadata("test", 6, 12345);
- SnapshotOffer snapshotOffer = new SnapshotOffer(metadata , snapshot);
+ SnapshotOffer snapshotOffer = new SnapshotOffer(metadata, snapshot);
sendMessageToSupport(snapshotOffer);
assertEquals("Election votedFor", electionVotedFor, context.getTermInformation().getVotedFor());
assertTrue("Dynamic server configuration", context.isDynamicServerConfigurationInUse());
assertEquals("Peer List", Sets.newHashSet("follower1", "follower2"),
- Sets.newHashSet(context.getPeerIds()));
+ Sets.newHashSet(context.getPeerIds()));
}
-}
+}
\ No newline at end of file
# Multiplicator of shard-leader-election-timeout-in-seconds for the purposes of initial datastore
# convergence. Each frontend datastore instance will wait specified amount of time before becoming
# exposed as a service. A value of 0 indicates waiting forever. Defaults to 3.
-initial-settle-timeout-multiplier=3
+#initial-settle-timeout-multiplier=3
+
+# Interval in seconds after which a snapshot should be taken during the recovery process.
+# A value of 0 means snapshots are never taken during recovery. Defaults to 0.
public static final int DEFAULT_SHARD_TX_COMMIT_TIMEOUT_IN_SECONDS = 30;
public static final int DEFAULT_JOURNAL_RECOVERY_BATCH_SIZE = 1;
public static final int DEFAULT_SNAPSHOT_BATCH_COUNT = 20000;
+ public static final int DEFAULT_RECOVERY_SNAPSHOT_INTERVAL_SECONDS = 0;
public static final int DEFAULT_HEARTBEAT_INTERVAL_IN_MILLIS = 500;
public static final int DEFAULT_ISOLATED_LEADER_CHECK_INTERVAL_IN_MILLIS =
DEFAULT_HEARTBEAT_INTERVAL_IN_MILLIS * 10;
DatastoreContext() {
setShardJournalRecoveryLogBatchSize(DEFAULT_JOURNAL_RECOVERY_BATCH_SIZE);
setSnapshotBatchCount(DEFAULT_SNAPSHOT_BATCH_COUNT);
+ setRecoverySnapshotIntervalSeconds(DEFAULT_RECOVERY_SNAPSHOT_INTERVAL_SECONDS);
setHeartbeatInterval(DEFAULT_HEARTBEAT_INTERVAL_IN_MILLIS);
setIsolatedLeaderCheckInterval(DEFAULT_ISOLATED_LEADER_CHECK_INTERVAL_IN_MILLIS);
setSnapshotDataThresholdPercentage(DEFAULT_SHARD_SNAPSHOT_DATA_THRESHOLD_PERCENTAGE);
setShardJournalRecoveryLogBatchSize(other.raftConfig.getJournalRecoveryLogBatchSize());
setSnapshotBatchCount(other.raftConfig.getSnapshotBatchCount());
+ setRecoverySnapshotIntervalSeconds(other.raftConfig.getRecoverySnapshotIntervalSeconds());
setHeartbeatInterval(other.raftConfig.getHeartBeatInterval().toMillis());
setIsolatedLeaderCheckInterval(other.raftConfig.getIsolatedCheckIntervalInMillis());
setSnapshotDataThresholdPercentage(other.raftConfig.getSnapshotDataThresholdPercentage());
raftConfig.setSnapshotBatchCount(shardSnapshotBatchCount);
}
+ /**
+ * Sets the interval in seconds after which a snapshot should be taken during the recovery process.
+ * Zero means don't take snapshots.
+ *
+ * @param recoverySnapshotInterval the interval in seconds
+ */
+ private void setRecoverySnapshotIntervalSeconds(final int recoverySnapshotInterval) {
+ raftConfig.setRecoverySnapshotIntervalSeconds(recoverySnapshotInterval);
+ }
+
@Deprecated
private void setShardSnapshotChunkSize(final int shardSnapshotChunkSize) {
// We'll honor the shardSnapshotChunkSize setting for backwards compatibility but only if it doesn't exceed
return this;
}
+ /**
+ * Sets the interval in seconds after which a snapshot should be taken during the recovery process.
+ *
+ * @param recoverySnapshotIntervalSeconds the interval in seconds; 0 means never take snapshots
+ * @return this Builder
+ * @throws IllegalArgumentException if the value is negative
+ */
+ public Builder recoverySnapshotIntervalSeconds(final int recoverySnapshotIntervalSeconds) {
+ checkArgument(recoverySnapshotIntervalSeconds >= 0);
+ datastoreContext.setRecoverySnapshotIntervalSeconds(recoverySnapshotIntervalSeconds);
+ return this;
+ }
+
public Builder shardSnapshotDataThresholdPercentage(final int shardSnapshotDataThresholdPercentage) {
datastoreContext.setSnapshotDataThresholdPercentage(shardSnapshotDataThresholdPercentage);
return this;
Zero value means wait indefinitely (as long as it takes).";
}
+ leaf recovery-snapshot-interval-seconds {
+ default 0;
+ type uint32;
+ description "Interval in seconds after which a snapshot should be taken during the recovery process. 0 means never.";
+ }
+
leaf shard-batched-modification-count {
default 1000;
type non-zero-uint32-type;
properties.put("shard-initialization-timeout-in-seconds", "82");
properties.put("shard-leader-election-timeout-in-seconds", "66");
properties.put("initial-settle-timeout-multiplier", "5");
+ properties.put("recovery-snapshot-interval-seconds", "360");
properties.put("shard-isolated-leader-check-interval-in-millis", "123");
properties.put("shard-snapshot-data-threshold-percentage", "100");
properties.put("shard-election-timeout-factor", "21");
assertEquals(82, context.getShardInitializationTimeout().duration().toSeconds());
assertEquals(66, context.getShardLeaderElectionTimeout().duration().toSeconds());
assertEquals(5, context.getInitialSettleTimeoutMultiplier());
+ assertEquals(360, context.getShardRaftConfig().getRecoverySnapshotIntervalSeconds());
assertEquals(123, context.getShardRaftConfig().getIsolatedCheckIntervalInMillis());
assertEquals(100, context.getShardRaftConfig().getSnapshotDataThresholdPercentage());
assertEquals(21, context.getShardRaftConfig().getElectionTimeoutFactor());
import static org.opendaylight.controller.cluster.datastore.DatastoreContext.DEFAULT_MAX_MESSAGE_SLICE_SIZE;
import static org.opendaylight.controller.cluster.datastore.DatastoreContext.DEFAULT_OPERATION_TIMEOUT_IN_MS;
import static org.opendaylight.controller.cluster.datastore.DatastoreContext.DEFAULT_PERSISTENT;
+import static org.opendaylight.controller.cluster.datastore.DatastoreContext.DEFAULT_RECOVERY_SNAPSHOT_INTERVAL_SECONDS;
import static org.opendaylight.controller.cluster.datastore.DatastoreContext.DEFAULT_SHARD_BATCHED_MODIFICATION_COUNT;
import static org.opendaylight.controller.cluster.datastore.DatastoreContext.DEFAULT_SHARD_ELECTION_TIMEOUT_FACTOR;
import static org.opendaylight.controller.cluster.datastore.DatastoreContext.DEFAULT_SHARD_INITIALIZATION_TIMEOUT;
builder.shardTransactionCommitTimeoutInSeconds(DEFAULT_SHARD_TX_COMMIT_TIMEOUT_IN_SECONDS + 1);
builder.shardJournalRecoveryLogBatchSize(DEFAULT_JOURNAL_RECOVERY_BATCH_SIZE + 1);
builder.shardSnapshotBatchCount(DEFAULT_SNAPSHOT_BATCH_COUNT + 1);
+ builder.recoverySnapshotIntervalSeconds(DEFAULT_RECOVERY_SNAPSHOT_INTERVAL_SECONDS + 1);
builder.shardHeartbeatIntervalInMillis(DEFAULT_HEARTBEAT_INTERVAL_IN_MILLIS + 1);
builder.shardTransactionCommitQueueCapacity(DEFAULT_SHARD_TX_COMMIT_QUEUE_CAPACITY + 1);
builder.shardInitializationTimeout(DEFAULT_SHARD_INITIALIZATION_TIMEOUT
assertEquals(DEFAULT_JOURNAL_RECOVERY_BATCH_SIZE + 1,
context.getShardRaftConfig().getJournalRecoveryLogBatchSize());
assertEquals(DEFAULT_SNAPSHOT_BATCH_COUNT + 1, context.getShardRaftConfig().getSnapshotBatchCount());
+ assertEquals(DEFAULT_RECOVERY_SNAPSHOT_INTERVAL_SECONDS + 1,
+ context.getShardRaftConfig().getRecoverySnapshotIntervalSeconds());
assertEquals(DEFAULT_HEARTBEAT_INTERVAL_IN_MILLIS + 1,
context.getShardRaftConfig().getHeartBeatInterval().length());
assertEquals(DEFAULT_SHARD_TX_COMMIT_QUEUE_CAPACITY + 1, context.getShardTransactionCommitQueueCapacity());