X-Git-Url: https://git.opendaylight.org/gerrit/gitweb?a=blobdiff_plain;f=opendaylight%2Fmd-sal%2Fsal-akka-raft%2Fsrc%2Fmain%2Fjava%2Forg%2Fopendaylight%2Fcontroller%2Fcluster%2Fraft%2Fbehaviors%2FCandidate.java;h=c125bd32b60a5c5d714ea13e7008417f904d88dc;hb=refs%2Fchanges%2F16%2F87616%2F4;hp=ecd49012461a7b1ee76f4678c7451a4fa1edbfb1;hpb=7b82869e73c5a9c8137521f1bf9b4e446d48440c;p=controller.git
diff --git a/opendaylight/md-sal/sal-akka-raft/src/main/java/org/opendaylight/controller/cluster/raft/behaviors/Candidate.java b/opendaylight/md-sal/sal-akka-raft/src/main/java/org/opendaylight/controller/cluster/raft/behaviors/Candidate.java
index ecd4901246..a8762ec76e 100644
--- a/opendaylight/md-sal/sal-akka-raft/src/main/java/org/opendaylight/controller/cluster/raft/behaviors/Candidate.java
+++ b/opendaylight/md-sal/sal-akka-raft/src/main/java/org/opendaylight/controller/cluster/raft/behaviors/Candidate.java
@@ -10,22 +10,25 @@ package org.opendaylight.controller.cluster.raft.behaviors;
import akka.actor.ActorRef;
import akka.actor.ActorSelection;
+import java.util.ArrayList;
+import java.util.Collection;
+import org.opendaylight.controller.cluster.raft.PeerInfo;
import org.opendaylight.controller.cluster.raft.RaftActorContext;
import org.opendaylight.controller.cluster.raft.RaftState;
-import org.opendaylight.controller.cluster.raft.internal.messages.ElectionTimeout;
+import org.opendaylight.controller.cluster.raft.ReplicatedLogEntry;
+import org.opendaylight.controller.cluster.raft.base.messages.ApplyState;
+import org.opendaylight.controller.cluster.raft.base.messages.ElectionTimeout;
import org.opendaylight.controller.cluster.raft.messages.AppendEntries;
import org.opendaylight.controller.cluster.raft.messages.AppendEntriesReply;
import org.opendaylight.controller.cluster.raft.messages.RaftRPC;
import org.opendaylight.controller.cluster.raft.messages.RequestVote;
import org.opendaylight.controller.cluster.raft.messages.RequestVoteReply;
-
-import java.util.Collection;
-import java.util.HashMap;
-import java.util.Map;
+import scala.concurrent.duration.FiniteDuration;
/**
- * The behavior of a RaftActor when it is in the CandidateState
- *
+ * The behavior of a RaftActor when it is in the Candidate raft state.
+ *
+ *
* Candidates (§5.2):
*
* - On conversion to candidate, start election:
@@ -43,137 +46,179 @@ import java.util.Map;
*/
public class Candidate extends AbstractRaftActorBehavior {
- private final Map peerToActor = new HashMap<>();
-
private int voteCount;
private final int votesRequired;
- public Candidate(RaftActorContext context) {
- super(context);
+ private final Collection votingPeers = new ArrayList<>();
- Collection peerPaths = context.getPeerAddresses().values();
+ public Candidate(final RaftActorContext context) {
+ super(context, RaftState.Candidate);
- for (String peerPath : peerPaths) {
- peerToActor.put(peerPath,
- context.actorSelection(peerPath));
+ for (PeerInfo peer: context.getPeers()) {
+ if (peer.isVoting()) {
+ votingPeers.add(peer.getId());
+ }
}
- context.getLogger().debug("Election:Candidate has following peers:"+peerToActor.keySet());
- if(peerPaths.size() > 0) {
- // Votes are required from a majority of the peers including self.
- // The votesRequired field therefore stores a calculated value
- // of the number of votes required for this candidate to win an
- // election based on it's known peers.
- // If a peer was added during normal operation and raft replicas
- // came to know about them then the new peer would also need to be
- // taken into consideration when calculating this value.
- // Here are some examples for what the votesRequired would be for n
- // peers
- // 0 peers = 1 votesRequired (0 + 1) / 2 + 1 = 1
- // 2 peers = 2 votesRequired (2 + 1) / 2 + 1 = 2
- // 4 peers = 3 votesRequired (4 + 1) / 2 + 1 = 3
- int noOfPeers = peerPaths.size();
- int self = 1;
- votesRequired = (noOfPeers + self) / 2 + 1;
- } else {
- votesRequired = 0;
- }
+ log.debug("{}: Election: Candidate has following voting peers: {}", logName(), votingPeers);
+
+ votesRequired = getMajorityVoteCount(votingPeers.size());
startNewTerm();
- scheduleElection(electionDuration());
+
+ if (votingPeers.isEmpty()) {
+ actor().tell(ElectionTimeout.INSTANCE, actor());
+ } else {
+ scheduleElection(electionDuration());
+ }
}
- @Override protected RaftState handleAppendEntries(ActorRef sender,
- AppendEntries appendEntries) {
+ @Override
+ public final String getLeaderId() {
+ return null;
+ }
- return state();
+ @Override
+ public final short getLeaderPayloadVersion() {
+ return -1;
}
- @Override protected RaftState handleAppendEntriesReply(ActorRef sender,
- AppendEntriesReply appendEntriesReply) {
+ @Override
+ protected RaftActorBehavior handleAppendEntries(final ActorRef sender, final AppendEntries appendEntries) {
+
+ log.debug("{}: handleAppendEntries: {}", logName(), appendEntries);
+
+ // Some other candidate for the same term became a leader and sent us an AppendEntries message
+ if (currentTerm() == appendEntries.getTerm()) {
+ log.info("{}: New Leader {} sent an AppendEntries to Candidate for term {} - will switch to Follower",
+ logName(), appendEntries.getLeaderId(), currentTerm());
- return state();
+ return switchBehavior(new Follower(context));
+ }
+
+ return this;
}
- @Override protected RaftState handleRequestVoteReply(ActorRef sender,
- RequestVoteReply requestVoteReply) {
+ @Override
+ protected RaftActorBehavior handleAppendEntriesReply(final ActorRef sender,
+ final AppendEntriesReply appendEntriesReply) {
+ return this;
+ }
+
+ @Override
+ protected RaftActorBehavior handleRequestVoteReply(final ActorRef sender, final RequestVoteReply requestVoteReply) {
+ log.debug("{}: handleRequestVoteReply: {}, current voteCount: {}", logName(), requestVoteReply, voteCount);
if (requestVoteReply.isVoteGranted()) {
voteCount++;
}
if (voteCount >= votesRequired) {
- return RaftState.Leader;
+ if (context.getLastApplied() < context.getReplicatedLog().lastIndex()) {
+ log.info("{}: LastApplied index {} is behind last index {} - switching to PreLeader",
+ logName(), context.getLastApplied(), context.getReplicatedLog().lastIndex());
+ return internalSwitchBehavior(RaftState.PreLeader);
+ } else {
+ return internalSwitchBehavior(RaftState.Leader);
+ }
}
- return state();
+ return this;
}
- @Override public RaftState state() {
- return RaftState.Candidate;
+ @Override
+ protected FiniteDuration electionDuration() {
+ return super.electionDuration().$div(context.getConfigParams().getCandidateElectionTimeoutDivisor());
}
- @Override
- public RaftState handleMessage(ActorRef sender, Object message) {
- if (message instanceof RaftRPC) {
- RaftRPC rpc = (RaftRPC) message;
- // If RPC request or response contains term T > currentTerm:
- // set currentTerm = T, convert to follower (§5.1)
- // This applies to all RPC messages and responses
- if (rpc.getTerm() > context.getTermInformation().getCurrentTerm()) {
- context.getTermInformation().updateAndPersist(rpc.getTerm(), null);
- return RaftState.Follower;
- }
- }
+ @Override
+ final ApplyState getApplyStateFor(final ReplicatedLogEntry entry) {
+ throw new IllegalStateException("A candidate should never attempt to apply " + entry);
+ }
+ @Override
+ public RaftActorBehavior handleMessage(final ActorRef sender, final Object message) {
if (message instanceof ElectionTimeout) {
+ log.debug("{}: Received ElectionTimeout", logName());
+
if (votesRequired == 0) {
// If there are no peers then we should be a Leader
// We wait for the election timeout to occur before declare
// ourselves the leader. This gives enough time for a leader
// who we do not know about (as a peer)
// to send a message to the candidate
- return RaftState.Leader;
+
+ return internalSwitchBehavior(RaftState.Leader);
}
+
startNewTerm();
scheduleElection(electionDuration());
- return state();
+ return this;
}
- return super.handleMessage(sender, message);
- }
+ if (message instanceof RaftRPC) {
- private void startNewTerm() {
+ RaftRPC rpc = (RaftRPC) message;
+ log.debug("{}: RaftRPC message received {}, my term is {}", logName(), rpc,
+ context.getTermInformation().getCurrentTerm());
+ // If RPC request or response contains term T > currentTerm:
+ // set currentTerm = T, convert to follower (§5.1)
+ // This applies to all RPC messages and responses
+ if (rpc.getTerm() > context.getTermInformation().getCurrentTerm()) {
+ log.info("{}: Term {} in \"{}\" message is greater than Candidate's term {} - switching to Follower",
+ logName(), rpc.getTerm(), rpc, context.getTermInformation().getCurrentTerm());
+
+ context.getTermInformation().updateAndPersist(rpc.getTerm(), null);
+
+ // The raft paper does not say whether or not a Candidate can/should process a RequestVote in
+ // this case but doing so gains quicker convergence when the sender's log is more up-to-date.
+ if (message instanceof RequestVote) {
+ super.handleMessage(sender, message);
+ }
+
+ return internalSwitchBehavior(RaftState.Follower);
+ }
+ }
+
+ return super.handleMessage(sender, message);
+ }
+
+ private void startNewTerm() {
// set voteCount back to 1 (that is voting for self)
voteCount = 1;
// Increment the election term and vote for self
long currentTerm = context.getTermInformation().getCurrentTerm();
- context.getTermInformation().updateAndPersist(currentTerm + 1, context.getId());
+ long newTerm = currentTerm + 1;
+ context.getTermInformation().updateAndPersist(newTerm, context.getId());
- context.getLogger().debug("Starting new term " + (currentTerm+1));
+ log.info("{}: Starting new election term {}", logName(), newTerm);
// Request for a vote
// TODO: Retry request for vote if replies do not arrive in a reasonable
// amount of time TBD
- for (ActorSelection peerActor : peerToActor.values()) {
- peerActor.tell(new RequestVote(
- context.getTermInformation().getCurrentTerm(),
- context.getId(),
- context.getReplicatedLog().lastIndex(),
- context.getReplicatedLog().lastTerm()),
- context.getActor()
- );
+ for (String peerId : votingPeers) {
+ ActorSelection peerActor = context.getPeerActorSelection(peerId);
+ if (peerActor != null) {
+ RequestVote requestVote = new RequestVote(
+ context.getTermInformation().getCurrentTerm(),
+ context.getId(),
+ context.getReplicatedLog().lastIndex(),
+ context.getReplicatedLog().lastTerm());
+
+ log.debug("{}: Sending {} to peer {}", logName(), requestVote, peerId);
+
+ peerActor.tell(requestVote, context.getActor());
+ }
}
-
-
}
- @Override public void close() throws Exception {
+ @Override
+ public void close() {
stopElection();
}
}