pekko/akka-cluster/src/main/scala/akka/cluster/Cluster.scala


/**
* Copyright (C) 2009-2017 Lightbend Inc. <http://www.lightbend.com>
*/
package akka.cluster
import java.io.Closeable
import java.util.concurrent.ThreadFactory
import java.util.concurrent.atomic.AtomicBoolean
import akka.ConfigurationException
import akka.actor._
import akka.cluster.ClusterSettings.DataCenter
import akka.dispatch.MonitorableThreadFactory
import akka.event.{ Logging, LoggingAdapter }
import akka.japi.Util
import akka.pattern._
import akka.remote.{ DefaultFailureDetectorRegistry, FailureDetector, _ }
import com.typesafe.config.{ Config, ConfigFactory }
import scala.annotation.varargs
import scala.collection.immutable
import scala.concurrent.duration._
import scala.concurrent.{ Await, ExecutionContext }
import scala.util.control.NonFatal
/**
* Cluster Extension Id and factory for creating Cluster extension.
*/
object Cluster extends ExtensionId[Cluster] with ExtensionIdProvider {
override def get(system: ActorSystem): Cluster = super.get(system)
override def lookup = Cluster
override def createExtension(system: ExtendedActorSystem): Cluster = new Cluster(system)
/**
* INTERNAL API
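*
* Extra invariant checks can be enabled with the JVM system property
* `akka.cluster.assert`, e.g. `-Dakka.cluster.assert=on`.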
*/
private[cluster] final val isAssertInvariantsEnabled: Boolean =
System.getProperty("akka.cluster.assert", "off").toLowerCase match {
case "on" | "true" true
case _ false
}
}
/**
* This module is responsible for cluster membership information. Changes to the cluster
* information are retrieved through [[#subscribe]]. Commands to operate the cluster are
* available through methods in this class, such as [[#join]], [[#down]] and [[#leave]].
*
* Each cluster [[Member]] is identified by its [[akka.actor.Address]], and
* the cluster address of this actor system is [[#selfAddress]]. A member also has a status;
* initially [[MemberStatus]] `Joining` followed by [[MemberStatus]] `Up`.
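*
* The extension is obtained from the actor system, for example:
* {{{
* val cluster = Cluster(system)
* }}}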
*/
class Cluster(val system: ExtendedActorSystem) extends Extension {
import ClusterEvent._
val settings = new ClusterSettings(system.settings.config, system.name)
import InfoLogger._
import settings._
/**
* The address including a `uid` of this cluster member.
* The `uid` is needed to be able to distinguish different
* incarnations of a member with the same hostname and port.
*/
val selfUniqueAddress: UniqueAddress = system.provider match {
case c: ClusterActorRefProvider =>
UniqueAddress(c.transport.defaultAddress, AddressUidExtension(system).longAddressUid)
case other => throw new ConfigurationException(
s"ActorSystem [${system}] needs to have a 'ClusterActorRefProvider' enabled in the configuration, currently uses [${other.getClass.getName}]")
}
/**
* The address of this cluster member.
*/
def selfAddress: Address = selfUniqueAddress.address
/** Data center to which this node belongs (defaults to "default" if not configured explicitly) */
def selfDataCenter: DataCenter = settings.SelfDataCenter
/**
* roles that this member has
*/
def selfRoles: Set[String] = settings.Roles
/**
* Java API: roles that this member has
*/
def getSelfRoles: java.util.Set[String] =
scala.collection.JavaConverters.setAsJavaSetConverter(selfRoles).asJava
private val _isTerminated = new AtomicBoolean(false)
private val log = Logging(system, getClass.getName)
// ClusterJmx is initialized as the last thing in the constructor
private var clusterJmx: Option[ClusterJmx] = None
logInfo("Starting up...")
val failureDetector: FailureDetectorRegistry[Address] = {
val createFailureDetector = () =>
FailureDetectorLoader.load(settings.FailureDetectorImplementationClass, settings.FailureDetectorConfig, system)
new DefaultFailureDetectorRegistry(createFailureDetector)
}
val crossDcFailureDetector: FailureDetectorRegistry[Address] = {
val createFailureDetector = () =>
FailureDetectorLoader.load(
settings.MultiDataCenter.CrossDcFailureDetectorSettings.ImplementationClass,
settings.MultiDataCenter.CrossDcFailureDetectorSettings.config, system)
new DefaultFailureDetectorRegistry(createFailureDetector)
}
// needs to be lazy to allow downing provider impls to access Cluster (if not we get deadlock)
lazy val downingProvider: DowningProvider =
DowningProvider.load(settings.DowningProviderClassName, system)
// ========================================================
// ===================== WORK DAEMONS =====================
// ========================================================
/**
* INTERNAL API
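*
* A dedicated scheduler is only created when the system scheduler ticks too slowly
* for the cluster. An illustrative `application.conf` that lets the cluster reuse
* the system scheduler (values are examples only):
* {{{
* akka.scheduler.tick-duration = 10ms
* akka.cluster.scheduler.tick-duration = 33ms
* }}}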
*/
private[cluster] val scheduler: Scheduler = {
if (system.scheduler.maxFrequency < 1.second / SchedulerTickDuration) {
logInfo(
"Using a dedicated scheduler for cluster. Default scheduler can be used if configured " +
"with 'akka.scheduler.tick-duration' [{} ms] <= 'akka.cluster.scheduler.tick-duration' [{} ms].",
(1000 / system.scheduler.maxFrequency).toInt, SchedulerTickDuration.toMillis)
val cfg = ConfigFactory.parseString(
s"akka.scheduler.tick-duration=${SchedulerTickDuration.toMillis}ms").withFallback(
system.settings.config)
val threadFactory = system.threadFactory match {
case tf: MonitorableThreadFactory => tf.withName(tf.name + "-cluster-scheduler")
case tf => tf
}
system.dynamicAccess.createInstanceFor[Scheduler](system.settings.SchedulerClass, immutable.Seq(
classOf[Config] -> cfg,
classOf[LoggingAdapter] -> log,
classOf[ThreadFactory] -> threadFactory)).get
} else {
// delegate to system.scheduler, but don't close over system
val systemScheduler = system.scheduler
new Scheduler with Closeable {
override def close(): Unit = () // we are using system.scheduler, which we are not responsible for closing
override def maxFrequency: Double = systemScheduler.maxFrequency
override def schedule(initialDelay: FiniteDuration, interval: FiniteDuration,
runnable: Runnable)(implicit executor: ExecutionContext): Cancellable =
systemScheduler.schedule(initialDelay, interval, runnable)
override def scheduleOnce(
delay: FiniteDuration,
runnable: Runnable)(implicit executor: ExecutionContext): Cancellable =
systemScheduler.scheduleOnce(delay, runnable)
}
}
}
// create supervisor for daemons under path "/system/cluster"
private val clusterDaemons: ActorRef = {
system.systemActorOf(Props(classOf[ClusterDaemon], settings).
withDispatcher(UseDispatcher).withDeploy(Deploy.local), name = "cluster")
}
/**
* INTERNAL API
*/
private[cluster] val clusterCore: ActorRef = {
implicit val timeout = system.settings.CreationTimeout
try {
Await.result((clusterDaemons ? InternalClusterAction.GetClusterCoreRef).mapTo[ActorRef], timeout.duration)
} catch {
case NonFatal(e) =>
log.error(e, "Failed to start up Cluster. You can try to increase 'akka.actor.creation-timeout'.")
shutdown()
// don't re-throw, that would cause the extension to be re-created
// from shutdown() or other places, which may result in
// InvalidActorNameException: actor name [cluster] is not unique
system.deadLetters
}
}
private[cluster] val readView: ClusterReadView = new ClusterReadView(this)
system.registerOnTermination(shutdown())
if (JmxEnabled)
clusterJmx = {
val jmx = new ClusterJmx(this, log)
jmx.createMBean()
Some(jmx)
}
logInfo("Started up successfully")
// ======================================================
// ===================== PUBLIC API =====================
// ======================================================
/**
* Returns true if this cluster instance has been shut down.
*/
def isTerminated: Boolean = _isTerminated.get
/**
* Current snapshot state of the cluster.
*/
def state: CurrentClusterState = readView.state
/**
* Subscribe to one or more cluster domain events.
* The `to` classes can be [[akka.cluster.ClusterEvent.ClusterDomainEvent]]
* or subclasses.
*
* A snapshot of [[akka.cluster.ClusterEvent.CurrentClusterState]]
* will be sent to the subscriber as the first message.
*/
@varargs def subscribe(subscriber: ActorRef, to: Class[_]*): Unit =
subscribe(subscriber, initialStateMode = InitialStateAsSnapshot, to: _*)
/**
* Subscribe to one or more cluster domain events.
* The `to` classes can be [[akka.cluster.ClusterEvent.ClusterDomainEvent]]
* or subclasses.
*
* If `initialStateMode` is `ClusterEvent.InitialStateAsEvents` the events corresponding
* to the current state will be sent to the subscriber to mimic what you would
* have seen if you were listening to the events when they occurred in the past.
*
* If `initialStateMode` is `ClusterEvent.InitialStateAsSnapshot` a snapshot of
* [[akka.cluster.ClusterEvent.CurrentClusterState]] will be sent to the subscriber as the
* first message.
*
* Note that for large clusters it is more efficient to use `InitialStateAsSnapshot`.
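*
* A minimal usage sketch (`listener` is a hypothetical subscriber actor):
* {{{
* Cluster(system).subscribe(
*   listener,
*   ClusterEvent.InitialStateAsEvents,
*   classOf[ClusterEvent.MemberUp],
*   classOf[ClusterEvent.UnreachableMember])
* }}}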
*/
@varargs def subscribe(subscriber: ActorRef, initialStateMode: SubscriptionInitialStateMode, to: Class[_]*): Unit = {
require(to.length > 0, "at least one `ClusterDomainEvent` class is required")
require(
to.forall(classOf[ClusterDomainEvent].isAssignableFrom),
s"subscribe to `akka.cluster.ClusterEvent.ClusterDomainEvent` or subclasses, was [${to.map(_.getName).mkString(", ")}]")
clusterCore ! InternalClusterAction.Subscribe(subscriber, initialStateMode, to.toSet)
}
/**
* Unsubscribe from all cluster domain events.
*/
def unsubscribe(subscriber: ActorRef): Unit =
clusterCore ! InternalClusterAction.Unsubscribe(subscriber, None)
/**
* Unsubscribe from a specific type of cluster domain event,
* matching a previous `subscribe` registration.
*/
def unsubscribe(subscriber: ActorRef, to: Class[_]): Unit =
clusterCore ! InternalClusterAction.Unsubscribe(subscriber, Some(to))
/**
* Send current (full) state of the cluster to the specified
* receiver. If you want this to happen periodically you need to schedule
* a call to this method yourself. Note that you can also retrieve the current
* state with [[#state]].
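*
* For example, a periodic push to a hypothetical `monitor` actor
* (a sketch, not part of this API):
* {{{
* import scala.concurrent.duration._
* import system.dispatcher
* system.scheduler.schedule(5.seconds, 5.seconds) {
*   Cluster(system).sendCurrentClusterState(monitor)
* }
* }}}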
*/
def sendCurrentClusterState(receiver: ActorRef): Unit =
clusterCore ! InternalClusterAction.SendCurrentClusterState(receiver)
/**
* Try to join this cluster node with the node specified by 'address'.
* A 'Join(selfAddress)' command is sent to the node to join.
*
* An actor system can only join a cluster once. Additional attempts will be ignored.
* When it has successfully joined it must be restarted to be able to join another
* cluster or to join the same cluster again.
*
* The name of the [[akka.actor.ActorSystem]] must be the same for all members of a
* cluster.
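*
* For example, joining this node's own address to bootstrap a single-node
* cluster (a common pattern, shown here as a sketch):
* {{{
* val cluster = Cluster(system)
* cluster.join(cluster.selfAddress)
* }}}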
*/
def join(address: Address): Unit =
clusterCore ! ClusterUserAction.JoinTo(fillLocal(address))
private def fillLocal(address: Address): Address = {
// local address might be used if grabbed from actorRef.path.address
if (address.hasLocalScope && address.system == selfAddress.system) selfAddress
else address
}
/**
* Join the specified seed nodes without defining them in config.
* Especially useful from tests when Addresses are unknown before startup time.
*
* An actor system can only join a cluster once. Additional attempts will be ignored.
* When it has successfully joined it must be restarted to be able to join another
* cluster or to join the same cluster again.
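*
* For example (host/port values are placeholders):
* {{{
* Cluster(system).joinSeedNodes(List(
*   AddressFromURIString("akka.tcp://ClusterSystem@127.0.0.1:2551"),
*   AddressFromURIString("akka.tcp://ClusterSystem@127.0.0.1:2552")))
* }}}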
*/
def joinSeedNodes(seedNodes: immutable.Seq[Address]): Unit =
clusterCore ! InternalClusterAction.JoinSeedNodes(seedNodes.toVector.map(fillLocal))
/**
* Java API
*
* Join the specified seed nodes without defining them in config.
* Especially useful from tests when Addresses are unknown before startup time.
*
* An actor system can only join a cluster once. Additional attempts will be ignored.
* When it has successfully joined it must be restarted to be able to join another
* cluster or to join the same cluster again.
*/
def joinSeedNodes(seedNodes: java.util.List[Address]): Unit =
joinSeedNodes(Util.immutableSeq(seedNodes))
/**
* Send command to issue state transition to LEAVING for the node specified by 'address'.
* The member will go through the status changes [[MemberStatus]] `Leaving` (not published to
* subscribers) followed by [[MemberStatus]] `Exiting` and finally [[MemberStatus]] `Removed`.
*
* Note that this command can be issued to any member in the cluster, not necessarily the
* one that is leaving. The cluster extension, but not the actor system or JVM, of the
* leaving member will be shut down after the leader has changed the status of the member to
* Exiting. Thereafter the member will be removed from the cluster. Normally this is
* handled automatically, but in case of network failures during this process it might
* still be necessary to set the node's status to Down in order to complete the removal.
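*
* For example, a graceful leave of this node itself:
* {{{
* val cluster = Cluster(system)
* cluster.leave(cluster.selfAddress)
* }}}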
*/
def leave(address: Address): Unit =
clusterCore ! ClusterUserAction.Leave(fillLocal(address))
/**
* Send command to DOWN the node specified by 'address'.
*
* When a member is considered by the failure detector to be unreachable, the leader is not
* allowed to perform its duties, such as changing the status of new joining members to 'Up'.
* The status of the unreachable member must be changed to 'Down', which can be done with
* this method.
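*
* For example (`unreachableAddress` is a hypothetical address reported as unreachable):
* {{{
* Cluster(system).down(unreachableAddress)
* }}}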
*/
def down(address: Address): Unit =
clusterCore ! ClusterUserAction.Down(fillLocal(address))
/**
* The supplied thunk will be run, once, when the current cluster member is `Up`.
* Typically used together with configuration option `akka.cluster.min-nr-of-members`
* to defer some action, such as starting actors, until the cluster has reached
* a certain size.
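*
* A minimal sketch (`startWorkers()` is a hypothetical application callback):
* {{{
* Cluster(system).registerOnMemberUp {
*   startWorkers()
* }
* }}}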
*/
def registerOnMemberUp[T](code: => T): Unit =
registerOnMemberUp(new Runnable { def run() = code })
/**
* Java API: The supplied callback will be run, once, when the current cluster member is `Up`.
* Typically used together with configuration option `akka.cluster.min-nr-of-members`
* to defer some action, such as starting actors, until the cluster has reached
* a certain size.
*/
def registerOnMemberUp(callback: Runnable): Unit =
clusterDaemons ! InternalClusterAction.AddOnMemberUpListener(callback)
/**
* The supplied thunk will be run, once, when the current cluster member is `Removed`.
* If the cluster has already been shut down the thunk will run on the caller thread immediately.
* Typically used together with `cluster.leave(cluster.selfAddress)` and then `system.terminate()`.
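*
* A sketch of that graceful shutdown sequence:
* {{{
* val cluster = Cluster(system)
* cluster.registerOnMemberRemoved {
*   system.terminate()
* }
* cluster.leave(cluster.selfAddress)
* }}}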
*/
def registerOnMemberRemoved[T](code: => T): Unit =
registerOnMemberRemoved(new Runnable { override def run(): Unit = code })
/**
* Java API: The supplied callback will be run, once, when the current cluster member is `Removed`.
* If the cluster has already been shut down the callback will run on the caller thread immediately.
* Typically used together with `cluster.leave(cluster.selfAddress)` and then `system.terminate()`.
*/
def registerOnMemberRemoved(callback: Runnable): Unit = {
if (_isTerminated.get())
callback.run()
else
clusterDaemons ! InternalClusterAction.AddOnMemberRemovedListener(callback)
}
/**
* Generate the remote actor path by replacing the Address in the RootActorPath for the given
* ActorRef with the cluster's `selfAddress`, unless the address's host is already defined
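*
* For example (illustrative addresses): a ref with the local path
* `akka://ClusterSystem/user/worker` maps to
* `akka.tcp://ClusterSystem@10.0.0.1:2552/user/worker` when the latter is the
* `selfAddress`.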
*/
def remotePathOf(actorRef: ActorRef): ActorPath = {
val path = actorRef.path
if (path.address.host.isDefined) {
path
} else {
path.root.copy(selfAddress) / path.elements withUid path.uid
}
}
// ========================================================
// ===================== INTERNAL API =====================
// ========================================================
/**
* INTERNAL API.
*
* Shuts down all connections to other members, the cluster daemon and the periodic gossip and cleanup tasks.
*
* Should not be called by the user. The user can issue a LEAVE command which will tell the node
* to go through the graceful handoff process `LEAVE -> EXITING -> REMOVED -> SHUTDOWN`.
*/
private[cluster] def shutdown(): Unit = {
if (_isTerminated.compareAndSet(false, true)) {
logInfo("Shutting down...")
system.stop(clusterDaemons)
// readView might be null if init fails before it is created
if (readView != null)
readView.close()
closeScheduler()
clusterJmx foreach { _.unregisterMBean() }
logInfo("Successfully shut down")
}
}
private def closeScheduler(): Unit = scheduler match {
case x: Closeable => x.close()
case _ => // ignore, this is fine
}
/**
* INTERNAL API
*/
private[cluster] object InfoLogger {
def logInfo(message: String): Unit =
if (LogInfo)
if (settings.SelfDataCenter == ClusterSettings.DefaultDataCenter)
log.info("Cluster Node [{}] - {}", selfAddress, message)
else
log.info("Cluster Node [{}] dc [{}] - {}", selfAddress, settings.SelfDataCenter, message)
def logInfo(template: String, arg1: Any): Unit =
if (LogInfo)
if (settings.SelfDataCenter == ClusterSettings.DefaultDataCenter)
log.info("Cluster Node [{}] - " + template, selfAddress, arg1)
else
log.info("Cluster Node [{}] dc [{}] - " + template, selfAddress, settings.SelfDataCenter, arg1)
def logInfo(template: String, arg1: Any, arg2: Any): Unit =
if (LogInfo)
if (settings.SelfDataCenter == ClusterSettings.DefaultDataCenter)
log.info("Cluster Node [{}] - " + template, selfAddress, arg1, arg2)
else
log.info("Cluster Node [{}] dc [{}] - " + template, selfAddress, settings.SelfDataCenter, arg1, arg2)
def logInfo(template: String, arg1: Any, arg2: Any, arg3: Any): Unit =
if (LogInfo)
if (settings.SelfDataCenter == ClusterSettings.DefaultDataCenter)
log.info("Cluster Node [{}] - " + template, selfAddress, arg1, arg2, arg3)
else
log.info("Cluster Node [{}] dc [" + settings.SelfDataCenter + "] - " + template, selfAddress, arg1, arg2, arg3)
}
}