com.teambytes.inflatable.raft.Leader.scala Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of inflatable_2.11 Show documentation
inflatable
There is a newer version: 1.0.5
package com.teambytes.inflatable.raft

import akka.actor.ActorRef

import model._
import protocol._
import config.RaftConfig

private[raft] trait Leader {
  this: RaftActor =>

  protected def raftConfig: RaftConfig

  private val HeartbeatTimerName = "heartbeat-timer"

  val leaderBehavior: StateFunction = {
    case Event(ElectedAsLeader, m: LeaderMeta) =>
      log.info("Became leader for {}", m.currentTerm)
      initializeLeaderState(m.config.members)
      startHeartbeat(m)
      stay()

    case Event(SendHeartbeat, m: LeaderMeta) =>
      sendHeartbeat(m)
      stay()

    // already won election, but votes may still be coming in
    case Event(_: ElectionMessage, _) =>
      stay()

    // client request
    case Event(ClientMessage(client, cmd: Command), m: LeaderMeta) =>
      log.info("Appending command: [{}] from {} to replicated log...", cmd, client)

      val entry = Entry(cmd, m.currentTerm, replicatedLog.nextIndex, Some(client))

      log.debug("adding to log: {}", entry)
      replicatedLog += entry
      matchIndex.put(m.clusterSelf, entry.index)
      log.debug("log status = {}", replicatedLog)

      val meta = maybeUpdateConfiguration(m, entry.command)
      replicateLog(meta)

      if (meta.config.isPartOfNewConfiguration(m.clusterSelf))
        stay() using meta
      else
        goto(Follower) using meta.forFollower // or maybe goto something else?

    // rogue Leader handling
    case Event(append: AppendEntries[Command], m: LeaderMeta) if append.term > m.currentTerm =>
      log.info("Leader (@ {}) got AppendEntries from fresher Leader (@ {}), will step down and the Leader will keep being: {}", m.currentTerm, append.term, sender())
      stepDown(m)

    case Event(append: AppendEntries[Command], m: LeaderMeta) if append.term <= m.currentTerm =>
      log.warning("Leader (@ {}) got AppendEntries from rogue Leader ({} @ {}); It's not fresher than self. Will send entries, to force it to step down.", m.currentTerm, sender(), append.term)
      sendEntries(sender(), m)
      stay()
    // end of rogue Leader handling

    // append entries response handling

    case Event(AppendRejected(term, index), m: LeaderMeta) if term > m.currentTerm =>
      stopHeartbeat()
      stepDown(m) // since there seems to be another leader!

    case Event(msg: AppendRejected, m: LeaderMeta) =>
      registerAppendRejected(follower(), msg, m)

    case Event(msg: AppendSuccessful, m: LeaderMeta) =>
      registerAppendSuccessful(follower(), msg, m)

    case Event(RequestConfiguration, m: LeaderMeta) =>
      sender() ! ChangeConfiguration(m.config)
      stay()

    case Event(AskForState, _) =>
      sender() ! IAmInState(Leader)
      stay()
  }

  def initializeLeaderState(members: Set[ActorRef]) {
    log.info("Preparing nextIndex and matchIndex table for followers, init all to: replicatedLog.lastIndex = {}", replicatedLog.lastIndex)
    nextIndex = LogIndexMap.initialize(members, replicatedLog.lastIndex)
    matchIndex = LogIndexMap.initialize(members, -1)
  }

  def sendEntries(follower: ActorRef, m: LeaderMeta) {
    follower ! AppendEntries(
      m.currentTerm,
      replicatedLog,
      fromIndex = nextIndex.valueFor(follower),
      leaderCommitId = replicatedLog.committedIndex
    )
  }

  def stopHeartbeat() {
    cancelTimer(HeartbeatTimerName)
  }

  def startHeartbeat(m: LeaderMeta) {
    sendHeartbeat(m)
    log.info("Starting hearbeat, with interval: {}", heartbeatInterval)
    setTimer(HeartbeatTimerName, SendHeartbeat, heartbeatInterval, repeat = true)
  }

  /** heartbeat is implemented as basically sending AppendEntry messages */
  def sendHeartbeat(m: LeaderMeta) {
    replicateLog(m)
  }

  def replicateLog(m: LeaderMeta) {
    m.membersExceptSelf foreach { member =>
      // todo remove me
//      log.info("sending: {} to {}", AppendEntries(m.currentTerm, replicatedLog, fromIndex = nextIndex.valueFor(member), leaderCommitId = replicatedLog.committedIndex), member)

      member ! AppendEntries(
        m.currentTerm,
        replicatedLog,
        fromIndex = nextIndex.valueFor(member),
        leaderCommitId = replicatedLog.committedIndex
      )
    }
  }

  def registerAppendRejected(member: ActorRef, msg: AppendRejected, m: LeaderMeta) = {
    val AppendRejected(followerTerm, followerIndex) = msg

    log.info("Follower {} rejected write: {} @ {}, back out the first index in this term and retry", follower(), followerTerm, followerIndex)

    nextIndex.putIfSmaller(follower(), followerIndex)

//    todo think if we send here or keep in heartbeat
    sendEntries(follower(), m)

    stay()
  }

  def registerAppendSuccessful(member: ActorRef, msg: AppendSuccessful, m: LeaderMeta) = {
    val AppendSuccessful(followerTerm, followerIndex) = msg

    log.info("Follower {} took write in term: {}, index: {}", follower(), followerTerm, nextIndex.valueFor(follower()))

    // update our tables for this member
    nextIndex.put(follower(), followerIndex)
    matchIndex.putIfGreater(follower(), nextIndex.valueFor(follower()))

    replicatedLog = maybeCommitEntry(m, matchIndex, replicatedLog)

    stay()
  }

  def maybeCommitEntry(m: LeaderMeta, matchIndex: LogIndexMap, replicatedLog: ReplicatedLog[Command]): ReplicatedLog[Command] = {
    val indexOnMajority = matchIndex.consensusForIndex(m.config)
    val willCommit = indexOnMajority > replicatedLog.committedIndex

    if (willCommit) log.info("Consensus for persisted index: {}. (Comitted index: {}, will commit now: {})", indexOnMajority, replicatedLog.committedIndex, willCommit)
    else log.info("Consensus for persisted index: {}. (Comitted index: {})", indexOnMajority, replicatedLog.committedIndex)

    if (willCommit) {
      val entries = replicatedLog.between(replicatedLog.committedIndex, indexOnMajority)

      entries foreach { entry =>
        handleCommitIfSpecialEntry.applyOrElse(entry, default = handleNormalEntry)

        if (raftConfig.publishTestingEvents)
          context.system.eventStream.publish(EntryCommitted(entry.index, m.clusterSelf))
      }

      replicatedLog.commit(indexOnMajority)
    } else {
      replicatedLog
    }
  }

  /**
   * Used for handling special messages, such as ''new Configuration'' or a ''Snapshot entry'' being comitted.
   *
   * Note that special log entries will NOT be propagated to the client state machine.
   */
  private val handleCommitIfSpecialEntry: PartialFunction[Entry[Command], Unit] = {
    case Entry(jointConfig: JointConsensusClusterConfiguration, _, _, _) =>
      self ! ClientMessage(self, jointConfig.transitionToStable) // will cause comitting of only "new" config

    case Entry(stableConfig: StableClusterConfiguration, _, _, _) =>
      // simply ignore, once this message is in our log we started using the new configuration anyway,
      // there's no need to apply this message onto the client state machine.
  }

  private val handleNormalEntry: PartialFunction[Any, Unit] = {
    case entry: Entry[Command] =>
      log.info("Committing log at index: {}; Applying command: {}, will send result to client: {}", entry.index, entry.command, entry.client)
      val result = apply(entry.command) // todo what if we apply a message the actor didnt understand? should fail "nicely"
      entry.client foreach { _ ! result }
  }

  /**
   * Configurations must be used by each node right away when they get appended to their logs (doesn't matter if not committed).
   * This method updates the Meta object if a configuration change is discovered.
   */
  def maybeUpdateConfiguration(meta: LeaderMeta, entry: Command): LeaderMeta = entry match {
    case newConfig: ClusterConfiguration if newConfig.isNewerThan(meta.config) =>
      log.info("Appended new configuration, will start using it now: {}", newConfig)
      meta.withConfig(newConfig)

    case _ =>
      meta
  }

}