2011-04-27 01:10:00 +02:00
|
|
|
/**
|
|
|
|
|
* Copyright (C) 2009-2011 Scalable Solutions AB <http://scalablesolutions.se>
|
|
|
|
|
*/
|
2011-04-28 20:12:37 +02:00
|
|
|
package akka.cluster
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
import org.apache.zookeeper._
|
|
|
|
|
import org.apache.zookeeper.Watcher.Event._
|
|
|
|
|
import org.apache.zookeeper.data.Stat
|
|
|
|
|
import org.apache.zookeeper.recipes.lock.{WriteLock, LockListener}
|
|
|
|
|
|
|
|
|
|
import org.I0Itec.zkclient._
|
|
|
|
|
import org.I0Itec.zkclient.serialize._
|
|
|
|
|
import org.I0Itec.zkclient.exception._
|
|
|
|
|
|
|
|
|
|
import java.util.concurrent.atomic.{AtomicBoolean, AtomicReference, AtomicInteger}
|
|
|
|
|
import java.util.concurrent.{ConcurrentSkipListSet, CopyOnWriteArrayList, Callable, ConcurrentHashMap}
|
|
|
|
|
import java.util.{List => JList}
|
|
|
|
|
import java.net.InetSocketAddress
|
|
|
|
|
import javax.management.StandardMBean
|
|
|
|
|
|
|
|
|
|
import scala.collection.immutable.{HashMap, HashSet}
|
|
|
|
|
import scala.collection.mutable.ConcurrentMap
|
|
|
|
|
import scala.collection.JavaConversions._
|
|
|
|
|
|
|
|
|
|
import ClusterProtocol._
|
|
|
|
|
import RemoteDaemonMessageType._
|
|
|
|
|
|
|
|
|
|
import akka.util._
|
2011-04-28 20:12:37 +02:00
|
|
|
import Helpers._
|
2011-04-27 01:10:00 +02:00
|
|
|
import akka.actor._
|
|
|
|
|
import akka.actor.Actor._
|
|
|
|
|
import akka.event.EventHandler
|
|
|
|
|
import akka.dispatch.{Dispatchers, Future}
|
|
|
|
|
import akka.remoteinterface._
|
|
|
|
|
import akka.config.Config._
|
|
|
|
|
import akka.serialization.{Format, Serializer}
|
|
|
|
|
import akka.serialization.Compression.LZF
|
|
|
|
|
import akka.AkkaException
|
|
|
|
|
|
2011-04-29 15:47:56 +02:00
|
|
|
//import akka.monitoring.Monitoring
|
2011-04-28 20:12:37 +02:00
|
|
|
import akka.cluster.zookeeper._
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
import com.eaio.uuid.UUID
|
|
|
|
|
|
|
|
|
|
import com.google.protobuf.ByteString
|
|
|
|
|
|
|
|
|
|
// FIXME add watch for each node that when the entry for the node is removed then the node shuts itself down
|
|
|
|
|
// FIXME Provisioning data in ZK (file names etc) and files in S3 and on disk
|
|
|
|
|
|
|
|
|
|
/** Exception type used by this file to report cluster-level errors; carries only a message. */
class ClusterException(message: String) extends AkkaException(message)
|
|
|
|
|
|
|
|
|
|
/**
 * JMX MBean for the cluster service.
 *
 * Declares the management operations and attributes only; no implementation
 * lives in this trait.
 *
 * @author <a href="http://jonasboner.com">Jonas Bonér</a>
 */
trait ClusterNodeMBean {

  // ---- life-cycle operations ----
  def start: Unit
  def stop: Unit

  def disconnect: Unit
  def reconnect: Unit
  def resign: Unit

  // ---- connection state ----
  def isConnected: Boolean

  // ---- remote server ----
  def getRemoteServerHostname: String
  def getRemoteServerPort: Int

  // ---- node / cluster identity ----
  def getNodeName: String
  def getClusterName: String
  def getZooKeeperServerAddresses: String

  // ---- membership ----
  def getMemberNodes: Array[String]
  def getLeader: String

  // ---- clustered actors (by UUID and by address) ----
  def getUuidsForClusteredActors: Array[String]
  def getAddressesForClusteredActors: Array[String]

  def getUuidsForActorsInUse: Array[String]
  def getAddressesForActorsInUse: Array[String]

  def getNodesForActorInUseWithUuid(uuid: String): Array[String]
  def getNodesForActorInUseWithAddress(address: String): Array[String]

  def getUuidsForActorsInUseOnNode(nodeName: String): Array[String]
  def getAddressesForActorsInUseOnNode(nodeName: String): Array[String]

  // ---- configuration elements ----
  def setConfigElement(key: String, value: String): Unit
  def getConfigElement(key: String): AnyRef
  def removeConfigElement(key: String): Unit
  def getConfigElementKeys: Array[String]
}
|
|
|
|
|
|
|
|
|
|
/**
 * Node address holds the node name and the cluster name and can be used as a hash lookup key for a Node instance.
 *
 * `hostname` defaults to `Cluster.lookupLocalhostName` and `port` to `Cluster.remoteServerPort`.
 * Construction fails with a `NullPointerException` when `nodeName` or `clusterName`
 * is `null` or the empty string (the node name is checked first).
 *
 * @author <a href="http://jonasboner.com">Jonas Bonér</a>
 */
final case class NodeAddress(
  clusterName: String,
  nodeName: String,
  hostname: String = Cluster.lookupLocalhostName,
  port: Int = Cluster.remoteServerPort) {

  // NOTE(review): an empty string is also reported as a NullPointerException; kept as-is
  // because callers may rely on the exception type.
  if ((nodeName eq null) || nodeName.isEmpty)
    throw new NullPointerException("Node name must not be null or empty string")

  if ((clusterName eq null) || clusterName.isEmpty)
    throw new NullPointerException("Cluster name must not be null or empty string")

  /** Renders the address as `clusterName:nodeName:hostname:port`. */
  override def toString = clusterName + ":" + nodeName + ":" + hostname + ":" + port
}
|
|
|
|
|
|
|
|
|
|
/**
 * Factory object for ClusterNode. Also holds global state such as configuration data etc.
 *
 * Global state kept here:
 *  - the configuration values read once at initialization,
 *  - the map of every `ClusterNode` created through `newNode`/`apply` (keyed by `NodeAddress`),
 *  - the set of cluster names those nodes belong to,
 *  - an optional local ZooKeeper server started via `startLocalCluster`.
 *
 * @author <a href="http://jonasboner.com">Jonas Bonér</a>
 */
object Cluster {
  val EMPTY_STRING = "".intern
  val UUID_PREFIX = "uuid:".intern

  // config options (the second argument of each getter is the fallback value)
  val name = config.getString("akka.cluster.name", "default")
  val zooKeeperServers = config.getString("akka.cluster.zookeeper-server-addresses", "localhost:2181")
  val remoteServerPort = config.getInt("akka.cluster.remote-server-port", 2552)
  val sessionTimeout = Duration(config.getInt("akka.cluster.session-timeout", 60), TIME_UNIT).toMillis.toInt
  val connectionTimeout = Duration(config.getInt("akka.cluster.connection-timeout", 60), TIME_UNIT).toMillis.toInt
  val maxTimeToWaitUntilConnected = Duration(config.getInt("akka.cluster.max-time-to-wait-until-connected", 30), TIME_UNIT).toMillis.toInt
  val shouldCompressData = config.getBool("akka.cluster.use-compression", false)
  val enableJMX = config.getBool("akka.enable-jmx", true)

  /**
   * Cluster membership change listener.
   * For Scala API.
   *
   * `notify` dispatches each `ChangeNotification` to the matching callback; every callback
   * has an empty default implementation so implementors override only what they need.
   */
  trait ChangeListener {
    def notify(event: ChangeNotification, client: ClusterNode) = event match {
      case NodeConnected(name)     => nodeConnected(name, client)
      case NodeDisconnected(name)  => nodeDisconnected(name, client)
      case NewLeader(name: String) => newLeader(name, client)
      case NewSession              => thisNodeNewSession(client)
      case ThisNode.Connected      => thisNodeConnected(client)
      case ThisNode.Disconnected   => thisNodeDisconnected(client)
      case ThisNode.Expired        => thisNodeExpired(client)
    }

    def nodeConnected(node: String, client: ClusterNode) = {}
    def nodeDisconnected(node: String, client: ClusterNode) = {}
    def newLeader(name: String, client: ClusterNode) = {}
    def thisNodeNewSession(client: ClusterNode) = {}
    def thisNodeConnected(client: ClusterNode) = {}
    def thisNodeDisconnected(client: ClusterNode) = {}
    def thisNodeExpired(client: ClusterNode) = {}
  }

  /**
   * Cluster membership change listener.
   * For Java API.
   */
  abstract class ChangeListenerAdapter extends ChangeListener

  /** Events delivered to `ChangeListener.notify`. */
  sealed trait ChangeNotification
  case class NodeConnected(node: String) extends ChangeNotification
  case class NodeDisconnected(node: String) extends ChangeNotification
  case class NewLeader(name: String) extends ChangeNotification
  case object NewSession extends ChangeNotification
  object ThisNode {
    case object Connected extends ChangeNotification
    case object Disconnected extends ChangeNotification
    case object Expired extends ChangeNotification
  }

  type Nodes = HashMap[NodeAddress, ClusterNode]

  val defaultSerializer = new SerializableSerializer

  private val _zkServer = new AtomicReference[Option[ZkServer]](None)
  private val _nodes = new AtomicReference(new Nodes)
  private val _clusterNames = new ConcurrentSkipListSet[String]

  /**
   * Atomically replaces the node map with `f(current)`, retrying the compare-and-set
   * until it succeeds. `f` may therefore be invoked more than once.
   */
  private[cluster] def updateNodes(f: Nodes => Nodes) = {
    var swapped = false
    while (!swapped) {
      val current = _nodes.get
      swapped = _nodes.compareAndSet(current, f(current))
    }
  }

  /**
   * Looks up the local hostname.
   */
  def lookupLocalhostName = NetworkUtil.getLocalhostName

  /**
   * Returns all the nodes created by this Cluster object, e.g. created in this class loader hierarchy in this JVM.
   */
  def nodes = _nodes.get

  /**
   * Returns an Array with NodeAddress for all the nodes in a specific cluster.
   *
   * Only nodes created through this object are considered. The match is on
   * `NodeAddress.clusterName` (the previous code compared the whole `NodeAddress`
   * with the name string, which could never be equal).
   */
  def nodesInCluster(clusterName: String): Array[NodeAddress] =
    _nodes.get.keys.filter(_.clusterName == clusterName).toArray

  /**
   * Returns the NodeAddress for a random node in a specific cluster.
   *
   * @throws IllegalArgumentException if no node is registered for `clusterName`
   */
  def randomNodeInCluster(clusterName: String): NodeAddress = {
    val candidates = nodesInCluster(clusterName)
    // Random.nextInt(0) would throw the same exception type with an unhelpful message.
    if (candidates.isEmpty)
      throw new IllegalArgumentException("No nodes registered for cluster [" + clusterName + "]")
    candidates(new java.util.Random().nextInt(candidates.length))
  }

  /**
   * Returns the names of all clusters that this JVM is connected to.
   */
  def clusters: Array[String] = _clusterNames.toList.toArray

  /**
   * Returns the node for a specific NodeAddress.
   * Fails with the map's missing-key exception if no node was created for that address.
   */
  def nodeFor(nodeAddress: NodeAddress) = _nodes.get()(nodeAddress)

  /**
   * Creates a new cluster node; ClusterNode.
   */
  def apply(
    nodeAddress: NodeAddress,
    zkServerAddresses: String = Cluster.zooKeeperServers,
    serializer: ZkSerializer = Cluster.defaultSerializer): ClusterNode =
    newNode(nodeAddress, zkServerAddresses, serializer)

  /**
   * Creates a new cluster node; ClusterNode.
   * Uses the configured ZooKeeper servers and the default serializer.
   */
  def newNode(nodeAddress: NodeAddress): ClusterNode =
    newNode(nodeAddress, Cluster.zooKeeperServers, Cluster.defaultSerializer)

  /**
   * Creates a new cluster node; ClusterNode.
   * Uses the default serializer.
   */
  def newNode(nodeAddress: NodeAddress, zkServerAddresses: String): ClusterNode =
    newNode(nodeAddress, zkServerAddresses, Cluster.defaultSerializer)

  /**
   * Creates a new cluster node; ClusterNode.
   * Uses the configured ZooKeeper servers.
   */
  def newNode(nodeAddress: NodeAddress, serializer: ZkSerializer): ClusterNode =
    newNode(nodeAddress, Cluster.zooKeeperServers, serializer)

  /**
   * Creates a new cluster node; ClusterNode.
   *
   * A `null` or empty `zkServerAddresses` falls back to `Cluster.zooKeeperServers`; a `null`
   * `serializer` falls back to `Cluster.defaultSerializer`. The node is recorded in the
   * global node map (replacing any earlier entry for the same address) and its cluster
   * name is added to the set returned by `clusters`.
   *
   * @throws IllegalArgumentException if `nodeAddress` is `null`
   */
  def newNode(
    nodeAddress: NodeAddress,
    zkServerAddresses: String,
    serializer: ZkSerializer): ClusterNode = {

    if (nodeAddress eq null) throw new IllegalArgumentException("NodeAddress can't be null")

    val node = new ClusterNode(
      nodeAddress,
      if ((zkServerAddresses eq null) || zkServerAddresses == "") Cluster.zooKeeperServers else zkServerAddresses,
      if (serializer eq null) Cluster.defaultSerializer else serializer)

    // FIXME Cluster nodes are never removed?
    updateNodes(_ + (nodeAddress -> node))
    _clusterNames add nodeAddress.clusterName
    node
  }

  /**
   * Starts up a local ZooKeeper server. Should only be used for testing purposes.
   */
  def startLocalCluster(): ZkServer =
    startLocalCluster("_akka_cluster/data", "_akka_cluster/log", 2181, 5000)

  /**
   * Starts up a local ZooKeeper server. Should only be used for testing purposes.
   */
  def startLocalCluster(port: Int, tickTime: Int): ZkServer =
    startLocalCluster("_akka_cluster/data", "_akka_cluster/log", port, tickTime)

  /**
   * Starts up a local ZooKeeper server. Should only be used for testing purposes.
   */
  def startLocalCluster(tickTime: Int): ZkServer =
    startLocalCluster("_akka_cluster/data", "_akka_cluster/log", 2181, tickTime)

  /**
   * Starts up a local ZooKeeper server. Should only be used for testing purposes.
   */
  def startLocalCluster(dataPath: String, logPath: String): ZkServer =
    // NOTE(review): tick time is 500 here but 5000 in the no-arg overload -- confirm which is intended.
    startLocalCluster(dataPath, logPath, 2181, 500)

  /**
   * Starts up a local ZooKeeper server. Should only be used for testing purposes.
   *
   * The started server is remembered so `shutdownLocalCluster` can stop it.
   * Any failure is logged and then rethrown unchanged.
   */
  def startLocalCluster(dataPath: String, logPath: String, port: Int, tickTime: Int): ZkServer = {
    try {
      val zkServer = AkkaZooKeeper.startLocalServer(dataPath, logPath, port, tickTime)
      _zkServer.set(Some(zkServer))
      zkServer
    } catch {
      case e: Throwable =>
        EventHandler.error(e, this, "Could not start local ZooKeeper cluster")
        throw e
    }
  }

  /**
   * Resets all clusters connected to in this JVM.
   * <p/>
   * <b>WARNING: Use with care</b>
   *
   * Disconnects every known node and shuts down its remote service, then deletes each
   * cluster's root node and the barriers node in ZooKeeper using a temporary client.
   */
  def reset(): Unit = withPrintStackTraceOnError {
    EventHandler.info(this, "Resetting all clusters connected to in this JVM")

    if (!clusters.isEmpty) {
      nodes.values foreach { node =>
        node.disconnect
        node.remoteService.shutdown
      }

      implicit val zkClient = newZkClient
      try {
        clusters foreach (resetNodesInCluster(_))
        ignore[ZkNoNodeException](zkClient.deleteRecursive(ZooKeeperBarrier.BarriersNode))
      } finally {
        // always release the temporary client, even if a delete fails
        zkClient.close
      }
    }
  }

  /**
   * Resets all nodes in a specific cluster.
   *
   * Deletes the ZooKeeper subtree rooted at `"/" + clusterName`; a missing node is ignored.
   * NOTE(review): when no implicit client is supplied, the default `newZkClient` is not
   * closed by this method.
   */
  def resetNodesInCluster(clusterName: String)(implicit zkClient: AkkaZkClient = newZkClient) = withPrintStackTraceOnError {
    EventHandler.info(this, "Resetting nodes in cluster [%s]".format(clusterName))
    ignore[ZkNoNodeException](zkClient.deleteRecursive("/" + clusterName))
  }

  /**
   * Shut down the local ZooKeeper server.
   * Calls `reset` first, then shuts down the server started by `startLocalCluster` (if any).
   */
  def shutdownLocalCluster() = withPrintStackTraceOnError {
    EventHandler.info(this, "Shuts down local cluster")
    reset
    _zkServer.get.foreach(_.shutdown)
    _zkServer.set(None)
  }

  /**
   * Creates a new AkkaZkClient.
   * Uses the configured servers, timeouts and the default serializer; the caller owns the client.
   */
  def newZkClient: AkkaZkClient = new AkkaZkClient(zooKeeperServers, sessionTimeout, connectionTimeout, defaultSerializer)

  /** Returns `uuid.toString`. */
  def uuidToString(uuid: UUID): String = uuid.toString

  /**
   * Parses a UUID from its string form.
   *
   * @throws ClusterException if `uuid` is `null`, empty, or `new UUID(uuid)` fails with a
   *                          `StringIndexOutOfBoundsException` (that case is also logged)
   */
  def stringToUuid(uuid: String): UUID = {
    if (uuid eq null) throw new ClusterException("UUID is null")
    if (uuid == "") throw new ClusterException("UUID is an empty string")
    try { new UUID(uuid) }
    catch {
      case e: StringIndexOutOfBoundsException =>
        val error = new ClusterException("UUID not valid [" + uuid + "]")
        EventHandler.error(error, this, "")
        throw error
    }
  }

  /** Builds a `UUID` from the high/low fields of the protocol message. */
  def uuidProtocolToUuid(uuid: UuidProtocol) = new UUID(uuid.getHigh, uuid.getLow)

  /** Builds the protocol message: `high` is `uuid.getTime`, `low` is `uuid.getClockSeqAndNode`. */
  def uuidToUuidProtocol(uuid: UUID) =
    UuidProtocol.newBuilder
      .setHigh(uuid.getTime)
      .setLow(uuid.getClockSeqAndNode)
      .build
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* @author <a href="http://jonasboner.com">Jonas Bonér</a>
|
|
|
|
|
*/
|
|
|
|
|
class ClusterNode private[akka] (
|
|
|
|
|
val nodeAddress: NodeAddress,
|
|
|
|
|
val zkServerAddresses: String,
|
|
|
|
|
val serializer: ZkSerializer) extends ErrorHandler { self =>
|
|
|
|
|
|
|
|
|
|
// Constructor preamble: reject a null address, bring the Cluster companion members
// into scope, and log the parameters this node is being created with.
if (nodeAddress eq null) throw new IllegalArgumentException("'nodeAddress' can not be 'null'")

import Cluster._

EventHandler.info(this, {
  val template =
    "\nCreating cluster node with" +
      "\n\tnode name = [%s]" +
      "\n\tcluster name = [%s]" +
      "\n\tzookeeper server addresses = [%s]" +
      "\n\tserializer = [%s]"
  template.format(nodeAddress.nodeName, nodeAddress.clusterName, zkServerAddresses, serializer)
})
|
|
|
|
|
|
|
|
|
|
// Actor that shuts down the client module of a remote client when that client
// reports an error or a disconnect; every other message is ignored.
val remoteClientLifeCycleListener = actorOf(new Actor {
  def receive = {
    case RemoteClientError(_, client, _)     => client.shutdownClientModule
    case RemoteClientDisconnected(client, _) => client.shutdownClientModule
    case _                                   => // ignore other
  }
}, "akka.cluster.remoteClientLifeCycleListener").start
|
2011-04-27 01:10:00 +02:00
|
|
|
|
2011-04-28 20:12:37 +02:00
|
|
|
// Started daemon actor for this node, created under RemoteClusterDaemon.ADDRESS.
// NOTE(review): `this` is handed to the daemon while the constructor is still running.
val remoteDaemon = actorOf(new RemoteClusterDaemon(this), RemoteClusterDaemon.ADDRESS).start
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
// Netty-based remote support for this node: started on the node's hostname/port,
// with the cluster daemon registered and the life-cycle listener attached.
val remoteService: RemoteSupport = {
  val nettyRemote = new akka.remote.netty.NettyRemoteSupport
  nettyRemote.start(nodeAddress.hostname, nodeAddress.port)
  nettyRemote.register(RemoteClusterDaemon.ADDRESS, remoteDaemon)
  nettyRemote.addListener(remoteClientLifeCycleListener)
  nettyRemote
}
|
|
|
|
|
// Socket address reported by the remote service created above.
val remoteServerAddress: InetSocketAddress = remoteService.address
|
|
|
|
|
|
|
|
|
|
// JMX object name for this node, derived from the node's hostname.
val clusterJmxObjectName = JMX.nameFor(nodeAddress.hostname, "monitoring", "cluster")
|
|
|
|
|
|
|
|
|
|
// static nodes: ZooKeeper paths, all rooted at "/<clusterName>"
val CLUSTER_NODE = "/" + nodeAddress.clusterName
val MEMBERSHIP_NODE = CLUSTER_NODE + "/members"
val CONFIGURATION_NODE = CLUSTER_NODE + "/config"
val PROVISIONING_NODE = CLUSTER_NODE + "/provisioning"
val ACTOR_REGISTRY_NODE = CLUSTER_NODE + "/actor-registry"
val ACTOR_LOCATIONS_NODE = CLUSTER_NODE + "/actor-locations"
val ACTOR_ADDRESS_TO_UUIDS_NODE = CLUSTER_NODE + "/actor-address-to-uuids"
val ACTORS_AT_NODE_NODE = CLUSTER_NODE + "/actors-at-address"

// The cluster root comes first, followed by its children.
val baseNodes = List(
  CLUSTER_NODE,
  MEMBERSHIP_NODE,
  ACTOR_REGISTRY_NODE,
  ACTOR_LOCATIONS_NODE,
  ACTORS_AT_NODE_NODE,
  ACTOR_ADDRESS_TO_UUIDS_NODE,
  CONFIGURATION_NODE,
  PROVISIONING_NODE)

// should NOT be part of 'baseNodes' only used by 'leaderLock'
val LEADER_ELECTION_NODE = CLUSTER_NODE + "/leader"
|
|
|
|
|
|
|
|
|
|
// Connection switch: starts off; flipped by start() and stop().
val isConnected = new Switch(false)

// Set by the leader-election callback when this node acquires/releases the leader lock.
val isLeader = new AtomicBoolean(false)

val electionNumber = new AtomicInteger(Integer.MAX_VALUE)

// Membership path for this node's own name.
private val membershipNodePath = membershipPathFor(nodeAddress.nodeName)
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
// local caches of ZK data
private[akka] val locallyCachedMembershipNodes = new ConcurrentSkipListSet[String]()
private[akka] val nodeNameToAddress: ConcurrentMap[String, InetSocketAddress] = new ConcurrentHashMap[String, InetSocketAddress]
private[akka] val locallyCheckedOutActors: ConcurrentMap[UUID, Array[Byte]] = new ConcurrentHashMap[UUID, Array[Byte]]

/** Snapshot of the locally cached membership node names. */
def membershipNodes: Array[String] = locallyCachedMembershipNodes.toList.toArray

// keyed by String; each value pairs a socket address with an ActorRef
private[akka] val replicaConnections: ConcurrentMap[String, (InetSocketAddress, ActorRef)] =
  new ConcurrentHashMap[String, (InetSocketAddress, ActorRef)]
|
|
|
|
|
|
|
|
|
|
// zookeeper listeners
private val stateListener = new StateListener(this)
private val membershipListener = new MembershipChildListener(this)

// cluster node listeners (populated through register())
private val changeListeners = new CopyOnWriteArrayList[ChangeListener]()

// Address -> ClusterActorRef
private val clusterActorRefs = new Index[InetSocketAddress, ClusterActorRef]

// resources: ZooKeeper client built from this node's server addresses and serializer
// plus the session/connection timeouts from the Cluster configuration
private[cluster] val zkClient = new AkkaZkClient(zkServerAddresses, sessionTimeout, connectionTimeout, serializer)
|
|
|
|
|
|
|
|
|
|
// Callback handed to the leader lock: keeps 'isLeader' in sync with lock ownership
// and publishes a NewLeader notification when this node acquires the lock.
private[cluster] val leaderElectionCallback = new LockListener {

  def lockAcquired(): Unit = {
    EventHandler.info(this, "Node [%s] is the new leader".format(self.nodeAddress.nodeName))
    self.isLeader.set(true)
    self.publish(Cluster.NewLeader(self.nodeAddress.nodeName))
  }

  def lockReleased(): Unit = {
    EventHandler.info(this,
      "Node [%s] is *NOT* the leader anymore".format(self.nodeAddress.nodeName))
    self.isLeader.set(false)
    // self.publish(Cluster.LeaderChange)
  }
}
|
|
|
|
|
|
|
|
|
|
// Write lock on LEADER_ELECTION_NODE used for leader election. The anonymous subclass
// exposes the lock's private 'ownerId' field through reflection as 'leader'.
private[cluster] val leaderLock = new WriteLock(
  zkClient.connection.getZookeeper, LEADER_ELECTION_NODE, null, leaderElectionCallback) {

  // ugly hack, but what do you do? <--- haha epic
  private val ownerIdAccessor = {
    val field = classOf[WriteLock].getDeclaredField("ownerId")
    field.setAccessible(true)
    field
  }

  def leader: String = ownerIdAccessor.get(this).asInstanceOf[String]
}
|
|
|
|
|
|
|
|
|
|
// Only invoke createMBean when JMX is enabled in the configuration ('akka.enable-jmx').
if (enableJMX) createMBean
|
|
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Node
|
|
|
|
|
// =======================================
|
|
|
|
|
|
|
|
|
|
/** True while the connection switch is on, i.e. between start() and stop(). */
def isRunning: Boolean = isConnected.isOn
|
|
|
|
|
|
|
|
|
|
/**
 * Turns the connection switch on, running `initializeNode` as the switch-on action.
 *
 * @return this node, to allow call chaining
 */
def start(): ClusterNode = {
  isConnected.switchOn { initializeNode }
  this
}
|
|
|
|
|
|
|
|
|
|
/**
 * Turns the connection switch off and, as the switch-off action, tears the node down:
 * deletes this node's membership path, clears the local caches, shuts down client
 * connections and the remote server, stops the helper actors, removes the node from
 * the global node map and finally disconnects from ZooKeeper.
 */
def stop(): Unit = isConnected switchOff {
  ignore[ZkNoNodeException] { zkClient.deleteRecursive(membershipNodePath) }

  locallyCachedMembershipNodes.clear
  locallyCheckedOutActors.clear

  // shut down client connections
  replicaConnections.toList foreach {
    case (_, (address, _)) => remote.shutdownClientConnection(address)
  }

  // shutdown server
  remoteService.shutdown

  remoteClientLifeCycleListener.stop
  remoteDaemon.stop

  // for monitoring remote listener
  registry.local.actors.filter(remoteService.hasListener).foreach(_.stop)

  replicaConnections.clear
  updateNodes(_ - nodeAddress)

  disconnect()
  EventHandler.info(this, "Cluster node shut down [%s]".format(nodeAddress))
}
|
|
|
|
|
|
|
|
|
|
/**
 * Unsubscribes all listeners from the ZooKeeper client and closes it.
 *
 * @return this node, to allow call chaining
 */
def disconnect(): ClusterNode = {
  zkClient.unsubscribeAll
  zkClient.close
  this
}
|
|
|
|
|
|
|
|
|
|
/**
 * Asks the ZooKeeper client to reconnect.
 *
 * @return this node, to allow call chaining
 */
def reconnect(): ClusterNode = {
  zkClient.reconnect
  this
}
|
|
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Change notification
|
|
|
|
|
// =======================================
|
|
|
|
|
|
|
|
|
|
/**
 * Registers a cluster change listener.
 *
 * Listeners can only be added while the connection switch is off.
 *
 * @return this node, to allow call chaining
 * @throws IllegalStateException if the node has already been started
 */
def register(listener: ChangeListener): ClusterNode = {
  if (!isConnected.isOff)
    throw new IllegalStateException("Can not register 'ChangeListener' after the cluster node has been started")
  changeListeners.add(listener)
  this
}
|
|
|
|
|
|
|
|
|
|
/** Delivers `change` to every registered change listener, passing this node as the client. */
private[cluster] def publish(change: ChangeNotification) = changeListeners.iterator.foreach(_.notify(change, this))
|
|
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Leader
|
|
|
|
|
// =======================================
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the name of the current leader, as exposed by the leader lock.
 */
def leader: String = leaderLock.leader
|
|
|
|
|
|
|
|
|
|
/**
 * Explicitly resign from being a leader. If this node is not a leader then this operation is a no-op.
 * Resigning releases the leader lock.
 */
def resign(): Unit = if (isLeader.get) leaderLock.unlock
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Actor
|
|
|
|
|
// =======================================
|
|
|
|
|
|
|
|
|
|
/**
 * Clusters an actor of a specific type. If the actor is already clustered then the clustered version will be updated
 * with the actor passed in as argument. You can use this to save off snapshots of the actor to a highly
 * available durable store.
 *
 * Convenience overload: creates and starts the actor via `Actor.actorOf(actorClass, address)`,
 * then stores it with replication factor 0 and `serializeMailbox = false`.
 */
def store[T <: Actor]
  (actorClass: Class[T], address: String)
  (implicit format: Format[T]): ClusterNode =
  store(Actor.actorOf(actorClass, address).start, 0, false)
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Clusters an actor of a specific type. If the actor is already clustered then the clustered version will be updated
 * with the actor passed in as argument. You can use this to save off snapshots of the actor to a highly
 * available durable store.
 *
 * Convenience overload: creates and starts the actor via `Actor.actorOf(actorClass, address)`,
 * then stores it with the given replication factor and `serializeMailbox = false`.
 */
def store[T <: Actor]
  (actorClass: Class[T], address: String, replicationFactor: Int)
  (implicit format: Format[T]): ClusterNode =
  store(Actor.actorOf(actorClass, address).start, replicationFactor, false)
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Clusters an actor of a specific type. If the actor is already clustered then the clustered version will be updated
 * with the actor passed in as argument. You can use this to save off snapshots of the actor to a highly
 * available durable store.
 *
 * Convenience overload: creates and starts the actor via `Actor.actorOf(actorClass, address)`,
 * then stores it with replication factor 0 and the given `serializeMailbox` flag.
 */
def store[T <: Actor]
  (actorClass: Class[T], address: String, serializeMailbox: Boolean)
  (implicit format: Format[T]): ClusterNode =
  store(Actor.actorOf(actorClass, address).start, 0, serializeMailbox)
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Clusters an actor of a specific type. If the actor is already clustered then the clustered version will be updated
 * with the actor passed in as argument. You can use this to save off snapshots of the actor to a highly
 * available durable store.
 *
 * Convenience overload: creates and starts the actor via `Actor.actorOf(actorClass, address)`,
 * then stores it with the given replication factor and `serializeMailbox` flag.
 */
def store[T <: Actor]
  (actorClass: Class[T], address: String, replicationFactor: Int, serializeMailbox: Boolean)
  (implicit format: Format[T]): ClusterNode =
  store(Actor.actorOf(actorClass, address).start, replicationFactor, serializeMailbox)
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Clusters an actor with UUID. If the actor is already clustered then the clustered version will be updated
 * with the actor passed in as argument. You can use this to save off snapshots of the actor to a highly
 * available durable store.
 *
 * Convenience overload: replication factor 0 and `serializeMailbox = false`.
 */
def store[T <: Actor]
  (actorRef: ActorRef)
  (implicit format: Format[T]): ClusterNode =
  store(actorRef, 0, false)
|
|
|
|
|
|
|
|
|
|
/**
 * Clusters an actor with UUID. If the actor is already clustered then the clustered version will be updated
 * with the actor passed in as argument. You can use this to save off snapshots of the actor to a highly
 * available durable store.
 *
 * Convenience overload: given replication factor and `serializeMailbox = false`.
 */
def store[T <: Actor]
  (actorRef: ActorRef, replicationFactor: Int)
  (implicit format: Format[T]): ClusterNode =
  store(actorRef, replicationFactor, false)
|
|
|
|
|
|
|
|
|
|
/**
 * Clusters an actor with UUID. If the actor is already clustered then the clustered version will be updated
 * with the actor passed in as argument. You can use this to save off snapshots of the actor to a highly
 * available durable store.
 *
 * Convenience overload: replication factor 0 and the given `serializeMailbox` flag.
 */
def store[T <: Actor]
  (actorRef: ActorRef, serializeMailbox: Boolean)
  (implicit format: Format[T]): ClusterNode =
  store(actorRef, 0, serializeMailbox)
|
|
|
|
|
|
|
|
|
|
/**
 * Clusters an actor with UUID. If the actor is already clustered then the clustered version will be updated
 * with the actor passed in as argument. You can use this to save off snapshots of the actor to a highly
 * available durable store.
 *
 * Steps:
 *  1. serialize the actor (honouring `serializeMailbox`), compressing with LZF when
 *     `shouldCompressData` is set;
 *  2. if the actor's registry path already exists, overwrite its data; otherwise create it
 *     together with the format, address, node, location and address-to-UUID entries;
 *  3. send a USE command for the actor's UUID to the replica connections selected for
 *     `replicationFactor`.
 *
 * @param actorRef          the actor to cluster; must be a `LocalActorRef`
 * @param replicationFactor passed to `replicaConnectionsForReplicationFactor`
 * @param serializeMailbox  forwarded to `toBinary`
 * @return this node, to allow call chaining
 * @throws IllegalArgumentException if `actorRef` is not a `LocalActorRef`
 * @throws ClusterException         if the node is not connected
 */
def store[T <: Actor]
  (actorRef: ActorRef, replicationFactor: Int, serializeMailbox: Boolean)
  (implicit format: Format[T]): ClusterNode = if (isConnected.isOn) {

  import akka.serialization.ActorSerialization._

  if (!actorRef.isInstanceOf[LocalActorRef]) throw new IllegalArgumentException(
    "'actorRef' must be an instance of 'LocalActorRef' [" + actorRef.getClass.getName + "]")

  val uuid = actorRef.uuid
  EventHandler.debug(this,
    "Clustering actor [%s] with UUID [%s]".format(actorRef.address, uuid))

  // Serialize once with the caller's 'serializeMailbox' choice; previously the
  // uncompressed branch called toBinary(actorRef) and silently dropped the flag.
  val serializedActor = toBinary(actorRef, serializeMailbox)(format)
  val actorBytes = if (shouldCompressData) LZF.compress(serializedActor) else serializedActor
  val actorRegistryPath = actorRegistryPathFor(uuid)

  // create UUID -> Array[Byte] for actor registry
  if (zkClient.exists(actorRegistryPath)) zkClient.writeData(actorRegistryPath, actorBytes) // FIXME check for size and warn if too big
  else {
    // A concurrent creator may win the race; "node already exists" is treated as success.
    zkClient.retryUntilConnected(new Callable[Either[String, Exception]]() {
      def call: Either[String, Exception] = {
        try {
          Left(zkClient.connection.create(actorRegistryPath, actorBytes, CreateMode.PERSISTENT))
        } catch { case e: KeeperException.NodeExistsException => Right(e) }
      }
    }) match {
      case Left(path)       => path
      case Right(exception) => actorRegistryPath
    }

    // create UUID -> Format registry (overwrite if already present)
    try {
      zkClient.createPersistent(actorRegistryFormatPathFor(uuid), format)
    } catch {
      case e: ZkNodeExistsException => zkClient.writeData(actorRegistryFormatPathFor(uuid), format)
    }

    // create UUID -> ADDRESS registry (overwrite if already present)
    try {
      zkClient.createPersistent(actorRegistryActorAddressPathFor(uuid), actorRef.address)
    } catch {
      case e: ZkNodeExistsException => zkClient.writeData(actorRegistryActorAddressPathFor(uuid), actorRef.address)
    }

    // create the registry node entry for the UUID (actorRegistryNodePathFor)
    ignore[ZkNodeExistsException](zkClient.createPersistent(actorRegistryNodePathFor(uuid)))

    // create the locations entry for the UUID (actorLocationsPathFor)
    ignore[ZkNodeExistsException](zkClient.createPersistent(actorLocationsPathFor(uuid)))

    // create ADDRESS -> UUIDs registry
    ignore[ZkNodeExistsException](zkClient.createPersistent(actorAddressToUuidsPathFor(actorRef.address)))
    ignore[ZkNodeExistsException](zkClient.createPersistent("%s/%s".format(actorAddressToUuidsPathFor(actorRef.address), uuid)))
  }

  // tell the selected replicas to start using the actor
  val command = RemoteDaemonMessageProtocol.newBuilder
    .setMessageType(USE)
    .setActorUuid(uuidToUuidProtocol(uuid))
    .build
  replicaConnectionsForReplicationFactor(replicationFactor) foreach { connection =>
    connection ! command
  }

  this
} else throw new ClusterException("Not connected to cluster")
|
|
|
|
|
|
|
|
|
|
/**
 * Removes the actor with the given UUID from the cluster.
 *
 * First asks the nodes that have the actor in use to release it, then drops the locally
 * cached checked-out entry and finally deletes the actor's ZooKeeper nodes. Nodes that are
 * already gone are ignored.
 */
def remove(uuid: UUID) = {
  releaseActorOnAllNodes(uuid)

  locallyCheckedOutActors.remove(uuid)
  // warning: ordering matters here
  // The address is stored below the registry node of the UUID, so it has to be looked up
  // before that registry node is deleted further down.
  val actorAddress = actorAddressForUuid(uuid)
  // 'actorAddressForUuid' yields "" when the address is unknown. The resulting path would end
  // in '/', which ZooKeeper's path validation rejects; the exception would skip the remaining cleanup.
  if ((actorAddress ne null) && actorAddress != "") {
    ignore[ZkNoNodeException](zkClient.deleteRecursive(actorAddressToUuidsPathFor(actorAddress))) // remove ADDRESS to UUID mapping
  }
  ignore[ZkNoNodeException](zkClient.deleteRecursive(actorAtNodePathFor(nodeAddress.nodeName, uuid)))
  ignore[ZkNoNodeException](zkClient.deleteRecursive(actorRegistryPathFor(uuid)))
  ignore[ZkNoNodeException](zkClient.deleteRecursive(actorLocationsPathFor(uuid)))
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Removes every actor registered under the given address from the cluster.
 * Does nothing when this node is not connected. Returns this node.
 */
def remove(address: String): ClusterNode = {
  isConnected ifOn {
    EventHandler.debug(this, "Removing actor(s) with ADDRESS [%s] from cluster".format(address))
    for (actorUuid <- uuidsForActorAddress(address)) remove(actorUuid)
  }
  this
}
|
|
|
|
|
|
|
|
|
|
/**
 * Is at least one actor registered under the given address present in the cluster registry?
 * Always false when this node is not connected to the cluster.
 */
def isClustered(actorAddress: String): Boolean =
  // 'exists' stops at the first hit, so no further ZooKeeper lookups are made once one is found
  isConnected.isOn && actorUuidsForActorAddress(actorAddress).exists { uuid =>
    zkClient.exists(actorRegistryPathFor(uuid))
  }
|
|
|
|
|
|
|
|
|
|
/**
 * Is an actor with the given address in use on 'this' node or not?
 */
def isInUseOnNode(actorAddress: String): Boolean = {
  isInUseOnNode(actorAddress, node = nodeAddress)
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Is at least one actor registered under the given address in use on the given node?
 * Always false when this node is not connected to the cluster.
 */
def isInUseOnNode(actorAddress: String, node: NodeAddress): Boolean =
  // 'exists' stops at the first hit, so no further ZooKeeper lookups are made once one is found
  isConnected.isOn && actorUuidsForActorAddress(actorAddress).exists { uuid =>
    zkClient.exists(actorLocationsPathFor(uuid, node))
  }
|
|
|
|
|
|
|
|
|
|
/**
 * Checks out the actors stored under 'actorAddress' for use on this node, e.g. checked out as
 * 'LocalActorRef's, and makes them available for remote access through lookup by their UUID.
 *
 * Returns one started 'LocalActorRef' per UUID, or an empty array when not connected.
 */
def use[T <: Actor](actorAddress: String)(
  implicit format: Format[T] = formatForActor(actorAddress)): Array[LocalActorRef] = {

  import akka.serialization.ActorSerialization._

  // Reads the stored actor bytes, uncompressing them when compression is enabled.
  def readActorBytes(actorPath: String): Either[Array[Byte], Exception] =
    zkClient.retryUntilConnected(new Callable[Either[Array[Byte], Exception]]() {
      def call: Either[Array[Byte], Exception] =
        try {
          val stored = zkClient.connection.readData(actorPath, new Stat, false)
          Left(if (shouldCompressData) LZF.uncompress(stored) else stored)
        } catch {
          case e: KeeperException.NodeExistsException => Right(e)
        }
    })

  // Registers this node as a user of the actor, then deserializes, registers and starts it.
  def checkOut(uuid: UUID): LocalActorRef = {
    EventHandler.debug(this,
      "Checking out actor with UUID [%s] to be used on node [%s]".format(uuid, nodeAddress.nodeName))

    ignore[ZkNodeExistsException](zkClient.createPersistent(actorAtNodePathFor(nodeAddress.nodeName, uuid), true))
    ignore[ZkNodeExistsException](zkClient.createEphemeral(actorLocationsPathFor(uuid, nodeAddress)))

    // set home address
    ignore[ZkNodeExistsException](zkClient.createPersistent(actorRegistryNodePathFor(uuid)))
    ignore[ZkNodeExistsException](zkClient.createEphemeral(actorRegistryNodePathFor(uuid, remoteServerAddress)))

    readActorBytes(actorRegistryPathFor(uuid)) match {
      case Right(exception) => throw exception
      case Left(bytes) =>
        locallyCheckedOutActors += (uuid -> bytes)
        // FIXME switch to ReplicatedActorRef here
        // val actor = new ReplicatedActorRef(fromBinary[T](bytes, remoteServerAddress)(format))
        val actor = fromBinary[T](bytes, remoteServerAddress)(format)
        remoteService.register(UUID_PREFIX + uuid, actor) // clustered refs are always registered and looked up by UUID
        actor.start
        actor.asInstanceOf[LocalActorRef]
    }
  }

  if (isConnected.isOn) actorUuidsForActorAddress(actorAddress) map (checkOut(_))
  else Array.empty[LocalActorRef]
}
|
|
|
|
|
|
|
|
|
|
/**
 * Using (checking out) the actor with a specific UUID on all nodes in the cluster:
 * sends a USE command to the replica connection of every membership node that has one.
 */
def useActorOnAllNodes(uuid: UUID): Unit = isConnected ifOn {
  EventHandler.debug(this,
    "Using (checking out) all actors with UUID [%s] on all nodes in cluster".format(uuid))
  val useCommand = RemoteDaemonMessageProtocol.newBuilder
    .setMessageType(USE)
    .setActorUuid(uuidToUuidProtocol(uuid))
    .build
  for {
    node <- membershipNodes
    entry <- replicaConnections.get(node)
  } entry._2 ! useCommand
}
|
|
|
|
|
|
|
|
|
|
/**
 * Using (checking out) a specific UUID on a specific node: sends a USE command to that node's
 * replica connection, if one is known. Nodes without a connection are silently skipped.
 */
def useActorOnNode(node: String, uuid: UUID): Unit = isConnected ifOn {
  replicaConnections.get(node) match {
    case Some((_, connection)) =>
      connection ! RemoteDaemonMessageProtocol.newBuilder
        .setMessageType(USE)
        .setActorUuid(uuidToUuidProtocol(uuid))
        .build
    case None => ()
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Checks in the actors with the given address after this node is done using them.
 *
 * For every UUID registered under the address the locally cached entry is dropped and this
 * node's ZooKeeper entries for the actor are deleted. Missing nodes are ignored.
 */
def release(actorAddress: String): Unit = isConnected ifOn {
  actorUuidsForActorAddress(actorAddress) foreach { uuid =>
    EventHandler.debug(this,
      "Releasing actor with UUID [%s] after usage".format(uuid))
    locallyCheckedOutActors.remove(uuid)
    // 'deleteRecursive' removes the node itself as well, so no separate 'delete' of the same path is needed
    ignore[ZkNoNodeException](zkClient.deleteRecursive(actorAtNodePathFor(nodeAddress.nodeName, uuid)))
    ignore[ZkNoNodeException](zkClient.delete(actorLocationsPathFor(uuid, nodeAddress)))
    ignore[ZkNoNodeException](zkClient.delete(actorRegistryNodePathFor(uuid, remoteServerAddress)))
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Releases (checking in) the actor with a specific UUID on all nodes in the cluster where the
 * actor is in 'use': sends a RELEASE command to the replica connection of each such node.
 */
def releaseActorOnAllNodes(uuid: UUID): Unit = isConnected ifOn {
  EventHandler.debug(this,
    "Releasing (checking in) all actors with UUID [%s] on all nodes in cluster".format(uuid))
  val releaseCommand = RemoteDaemonMessageProtocol.newBuilder
    .setMessageType(RELEASE)
    .setActorUuid(uuidToUuidProtocol(uuid))
    .build
  for {
    node <- nodesForActorsInUseWithUuid(uuid)
    entry <- replicaConnections.get(node)
  } entry._2 ! releaseCommand
}
|
|
|
|
|
|
|
|
|
|
/**
 * Creates an ActorRef with a Router to the set of clustered actors registered under 'actorAddress'.
 *
 * The created ref is recorded in 'clusterActorRefs' under every remote address it routes to.
 * Throws a ClusterException when this node is not connected to the cluster.
 */
def ref(actorAddress: String, router: Router.RouterType): ActorRef = if (isConnected.isOn) {

  val addresses = addressesForActor(actorAddress)
  val actorType = ActorType.ScalaActor // FIXME later we also want to support TypedActor, then 'actorType' needs to be configurable

  EventHandler.debug(this,
    "Creating cluster actor ref with router [%s] for actors [%s]".format(router, addresses.mkString(", ")))

  // Records the cluster actor ref under each of the remote addresses it routes to.
  def registerClusterActorRefForAddress(actorRef: ClusterActorRef, addresses: Array[(UUID, InetSocketAddress)]) =
    addresses foreach { case (_, address) => clusterActorRefs.put(address, actorRef) }

  // FIXME remove?
  def refByUuid(uuid: UUID): ActorRef = {
    val actor = Router newRouter (
      router, addresses,
      uuidToString(uuid),
      Actor.TIMEOUT, actorType)
    registerClusterActorRefForAddress(actor, addresses)
    actor
  }

  def refByAddress(actorAddress: String): ActorRef = {
    val actor = Router newRouter (
      router, addresses,
      actorAddress,
      Actor.TIMEOUT, actorType)
    registerClusterActorRefForAddress(actor, addresses)
    actor
  }

  refByAddress(actorAddress)
} else throw new ClusterException("Not connected to cluster")
|
|
|
|
|
|
|
|
|
|
/**
 * Migrate the actor with the given address from 'this' node to node 'to'.
 */
def migrate(to: NodeAddress, actorAddress: String): Unit = {
  migrate(from = nodeAddress, to = to, actorAddress = actorAddress)
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Migrate the actor with the given address from node 'from' to node 'to'.
 *
 * Throws IllegalArgumentException when either node address is null and ClusterException when
 * the actor is not in use on node 'from'. Does nothing when not connected.
 */
def migrate(
  from: NodeAddress, to: NodeAddress, actorAddress: String): Unit = isConnected ifOn {
  if (from eq null) throw new IllegalArgumentException("NodeAddress 'from' can not be 'null'")
  if (to eq null) throw new IllegalArgumentException("NodeAddress 'to' can not be 'null'")
  if (!isInUseOnNode(actorAddress, from))
    throw new ClusterException("Can't move actor from node [" + from + "] since it does not exist on this node")
  migrateWithoutCheckingThatActorResidesOnItsHomeNode(from, to, actorAddress)
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the UUIDs of all actors checked out on this node.
 */
def uuidsForActorsInUse: Array[UUID] = {
  val thisNodeName = nodeAddress.nodeName
  uuidsForActorsInUseOnNode(thisNodeName)
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the addresses of all actors checked out on this node.
 */
def addressesForActorsInUse: Array[String] = {
  val checkedOutUuids = uuidsForActorsInUse
  actorAddressForUuids(checkedOutUuids)
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Returns the UUIDs of all actors registered in this cluster, i.e. the children of the
 * actor registry node. Empty when this node is not connected.
 */
def uuidsForClusteredActors: Array[UUID] =
  if (!isConnected.isOn) Array.empty[UUID]
  else {
    val registered = zkClient.getChildren(ACTOR_REGISTRY_NODE).toList
    registered.map(child => new UUID(child)).toArray
  }
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the addresses of all actors registered in this cluster.
 */
def addressesForClusteredActors: Array[String] = {
  val registeredUuids = uuidsForClusteredActors
  actorAddressForUuids(registeredUuids)
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Returns the actor address stored for the actor with a specific UUID.
 * Returns "" when no address node exists or when this node is not connected.
 */
def actorAddressForUuid(uuid: UUID): String =
  if (!isConnected.isOn) ""
  else try {
    zkClient.readData(actorRegistryActorAddressPathFor(uuid)).asInstanceOf[String]
  } catch {
    case e: ZkNoNodeException => ""
  }
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the actor addresses for the given UUIDs. UUIDs whose lookup yields ""
 * are left out of the result.
 */
def actorAddressForUuids(uuids: Array[UUID]): Array[String] = {
  val lookedUp = uuids map (uuid => actorAddressForUuid(uuid))
  lookedUp filterNot (_ == "")
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Returns the UUIDs of the actors registered under an actor address.
 * Empty when the address has no node in ZooKeeper or when this node is not connected.
 */
def uuidsForActorAddress(actorAddress: String): Array[UUID] =
  if (!isConnected.isOn) Array.empty[UUID]
  else try {
    val children = zkClient.getChildren(actorAddressToUuidsPathFor(actorAddress)).toList
    children.map(child => new UUID(child)).toArray
  } catch {
    case e: ZkNoNodeException => Array[UUID]()
  }
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the names of the nodes on which the actor with the given UUID is in use.
 * Empty when the actor has no locations node or when this node is not connected.
 */
def nodesForActorsInUseWithUuid(uuid: UUID): Array[String] =
  if (!isConnected.isOn) Array.empty[String]
  else try {
    val nodeNames = zkClient.getChildren(actorLocationsPathFor(uuid)).toList
    nodeNames.toArray
  } catch {
    case e: ZkNoNodeException => Array[String]()
  }
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the names of the nodes on which actors with the given address are in use.
 * Empty when this node is not connected.
 */
def nodesForActorsInUseWithAddress(address: String): Array[String] = {
  // Node names for one UUID; empty when the UUID has no locations node.
  def nodesFor(uuid: UUID): Array[String] =
    try {
      zkClient.getChildren(actorLocationsPathFor(uuid)).toList.toArray.asInstanceOf[Array[String]]
    } catch {
      case e: ZkNoNodeException => Array[String]()
    }

  if (isConnected.isOn) {
    // the mapped array is passed straight to 'flatten' so its expected parameter type drives inference
    flatten {
      actorUuidsForActorAddress(address) map { uuid => nodesFor(uuid) }
    }
  } else Array.empty[String]
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the UUIDs of all actors in use registered on a specific node.
 * Empty when the node has no actors node in ZooKeeper or when this node is not connected.
 */
def uuidsForActorsInUseOnNode(nodeName: String): Array[UUID] =
  if (!isConnected.isOn) Array.empty[UUID]
  else try {
    val children = zkClient.getChildren(actorsAtNodePathFor(nodeName)).toList
    children.map(child => new UUID(child)).toArray
  } catch {
    case e: ZkNoNodeException => Array[UUID]()
  }
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the addresses of all actors in use registered on a specific node.
 * Empty when this node is not connected.
 */
def addressesForActorsInUseOnNode(nodeName: String): Array[String] =
  // reuse the UUID lookup instead of repeating its ZooKeeper read and error handling here
  if (isConnected.isOn) actorAddressForUuids(uuidsForActorsInUseOnNode(nodeName))
  else Array.empty[String]
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the Format stored for the actors registered under 'actorAddress'.
 *
 * Throws IllegalStateException when no Format is found for the address, or when the actors
 * registered under the address do not all share an equal Format.
 */
def formatForActor[T <: Actor](actorAddress: String): Format[T] = {

  val formats = actorUuidsForActorAddress(actorAddress) map { uuid =>
    zkClient.readData(actorRegistryFormatPathFor(uuid), new Stat).asInstanceOf[Format[T]]
  }

  // check for emptiness before taking the head, otherwise 'head' fails with NoSuchElementException
  if (formats.isEmpty) throw new IllegalStateException("No Format found for [%s]".format(actorAddress))

  val format = formats.head
  if (formats exists (_ != format)) throw new IllegalStateException(
    "Multiple Format classes found for [%s]".format(actorAddress))
  format
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns, for every actor registered under 'actorAddress', its UUID paired with each socket
 * address found below the actor's registry 'node' path. Empty when such a path is missing.
 */
def addressesForActor(actorAddress: String): Array[(UUID, InetSocketAddress)] = {
  // Parses a "hostname:port" child name.
  def socketAddressFrom(hostAndPort: String): InetSocketAddress = {
    val fields = new java.util.StringTokenizer(hostAndPort, ":")
    val hostname = fields.nextToken
    val port = fields.nextToken.toInt
    new InetSocketAddress(hostname, port)
  }

  try {
    actorUuidsForActorAddress(actorAddress) flatMap { uuid =>
      zkClient.getChildren(actorRegistryNodePathFor(uuid)).toList map { child =>
        (uuid, socketAddressFrom(child))
      }
    }
  } catch {
    case e: ZkNoNodeException => Array[(UUID, InetSocketAddress)]()
  }
}
|
|
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Compute Grid
|
|
|
|
|
// =======================================
|
|
|
|
|
|
|
|
|
|
/**
 * Send a function 'Function0[Unit]' to be invoked on a random set of nodes, whose size is
 * defined by the 'replicationFactor' argument. The function is serialized with Java serialization.
 */
def send(f: Function0[Unit], replicationFactor: Int): Unit = {
  val payload = ByteString.copyFrom(Serializer.Java.toBinary(f))
  val message = RemoteDaemonMessageProtocol.newBuilder
    .setMessageType(FUNCTION_FUN0_UNIT)
    .setPayload(payload)
    .build
  for (replica <- replicaConnectionsForReplicationFactor(replicationFactor)) replica ! message
}
|
|
|
|
|
|
|
|
|
|
/**
 * Send a function 'Function0[Any]' to be invoked on a random set of nodes, whose size is
 * defined by the 'replicationFactor' argument.
 * Returns a 'List' with all the 'Future's from the computation.
 */
def send(f: Function0[Any], replicationFactor: Int): List[Future[Any]] = {
  val payload = ByteString.copyFrom(Serializer.Java.toBinary(f))
  val message = RemoteDaemonMessageProtocol.newBuilder
    .setMessageType(FUNCTION_FUN0_ANY)
    .setPayload(payload)
    .build
  val futures = replicaConnectionsForReplicationFactor(replicationFactor) map (replica => replica !!! message)
  futures.toList.asInstanceOf[List[Future[Any]]]
}
|
|
|
|
|
|
|
|
|
|
/**
 * Send a function 'Function1[Any, Unit]' to be invoked on a random set of nodes, whose size is
 * defined by the 'replicationFactor' argument, with the argument specified.
 * Function and argument are serialized together as a pair.
 */
def send(f: Function1[Any, Unit], arg: Any, replicationFactor: Int): Unit = {
  val payload = ByteString.copyFrom(Serializer.Java.toBinary((f, arg)))
  val message = RemoteDaemonMessageProtocol.newBuilder
    .setMessageType(FUNCTION_FUN1_ARG_UNIT)
    .setPayload(payload)
    .build
  for (replica <- replicaConnectionsForReplicationFactor(replicationFactor)) replica ! message
}
|
|
|
|
|
|
|
|
|
|
/**
 * Send a function 'Function1[Any, Any]' to be invoked on a random set of nodes, whose size is
 * defined by the 'replicationFactor' argument, with the argument specified.
 * Returns a 'List' with all the 'Future's from the computation.
 */
def send(f: Function1[Any, Any], arg: Any, replicationFactor: Int): List[Future[Any]] = {
  val payload = ByteString.copyFrom(Serializer.Java.toBinary((f, arg)))
  val message = RemoteDaemonMessageProtocol.newBuilder
    .setMessageType(FUNCTION_FUN1_ARG_ANY)
    .setPayload(payload)
    .build
  val futures = replicaConnectionsForReplicationFactor(replicationFactor) map (replica => replica !!! message)
  futures.toList.asInstanceOf[List[Future[Any]]]
}
|
|
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Config
|
|
|
|
|
// =======================================
|
|
|
|
|
|
|
|
|
|
/**
 * Stores a config element under the given key in the cluster registry, overwriting the
 * element if the key already exists. The bytes are compressed first when compression is enabled.
 *
 * Rethrows any exception raised while overwriting an existing element.
 */
def setConfigElement(key: String, bytes: Array[Byte]) {
  val compressedBytes = if (shouldCompressData) LZF.compress(bytes) else bytes
  // arguments follow the placeholder order: value first, then key
  EventHandler.debug(this,
    "Adding config value [%s] under key [%s] in cluster registry".format(compressedBytes, key))
  zkClient.retryUntilConnected(new Callable[Either[Unit, Exception]]() {
    def call: Either[Unit, Exception] = {
      try {
        Left(zkClient.connection.create(configurationPathFor(key), compressedBytes, CreateMode.PERSISTENT))
      } catch { case e: KeeperException.NodeExistsException =>
        // the key already exists: overwrite its data instead
        try {
          Left(zkClient.connection.writeData(configurationPathFor(key), compressedBytes))
        } catch { case e: Exception => Right(e) }
      }
    }
  }) match {
    case Left(_) => { /* do nothing */ }
    case Right(exception) => throw exception
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the config element stored under the key, or NULL if no element exists under the key.
 * The bytes are returned exactly as read from ZooKeeper.
 */
def getConfigElement(key: String): Array[Byte] = {
  val elementPath = configurationPathFor(key)
  try {
    zkClient.connection.readData(elementPath, new Stat, true)
  } catch {
    case e: KeeperException.NoNodeException => null
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Removes the config element stored under the key, including any children of its node.
 * A missing element is ignored.
 */
def removeConfigElement(key: String) = ignore[ZkNoNodeException] {
  EventHandler.debug(this, "Removing config element with key [%s] from cluster registry".format(key))
  val elementPath = configurationPathFor(key)
  zkClient.deleteRecursive(elementPath)
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the keys of all config elements, i.e. the children of the configuration node.
 */
def getConfigElementKeys: Array[String] = {
  val keys = zkClient.getChildren(CONFIGURATION_NODE).toList
  keys.toArray
}
|
|
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Queue
|
|
|
|
|
// =======================================
|
|
|
|
|
|
|
|
|
|
/**
 * Creates a ZooKeeperQueue rooted at 'rootPath' that uses this node's ZooKeeper client.
 * 'blocking' is passed through to the queue and defaults to true.
 */
def createQueue(rootPath: String, blocking: Boolean = true) = {
  new ZooKeeperQueue(zkClient, rootPath, blocking)
}
|
|
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Barrier
|
|
|
|
|
// =======================================
|
|
|
|
|
|
|
|
|
|
/**
 * Creates a ZooKeeperBarrier with the given name and count for this node, using this node's
 * cluster name and node name.
 */
def barrier(name: String, count: Int) = {
  val clusterName = nodeAddress.clusterName
  val nodeName = nodeAddress.nodeName
  ZooKeeperBarrier(zkClient, clusterName, name, nodeName, count)
}
|
|
|
|
|
|
|
|
|
|
/**
 * Creates a ZooKeeperBarrier with the given name, count and timeout for this node, using this
 * node's cluster name and node name.
 */
def barrier(name: String, count: Int, timeout: Duration) = {
  val clusterName = nodeAddress.clusterName
  val nodeName = nodeAddress.nodeName
  ZooKeeperBarrier(zkClient, clusterName, name, nodeName, count, timeout)
}
|
|
|
|
|
|
|
|
|
|
// =======================================
|
|
|
|
|
// Private
|
|
|
|
|
// =======================================
|
|
|
|
|
|
2011-04-29 15:47:56 +02:00
|
|
|
/** Path of the membership entry for the node with the given name. */
private[cluster] def membershipPathFor(node: String) =
  List[Any](MEMBERSHIP_NODE, node).mkString("/")
|
2011-04-27 01:10:00 +02:00
|
|
|
|
2011-04-29 15:47:56 +02:00
|
|
|
/** Path of the config element stored under the given key. */
private[cluster] def configurationPathFor(key: String) =
  List[Any](CONFIGURATION_NODE, key).mkString("/")
|
2011-04-27 01:10:00 +02:00
|
|
|
|
2011-04-29 15:47:56 +02:00
|
|
|
/** Path of the ADDRESS -> UUIDs entry for an actor address; dots in the address become underscores. */
private[cluster] def actorAddressToUuidsPathFor(actorAddress: String) = {
  val escapedAddress = actorAddress.replace('.', '_')
  List[Any](ACTOR_ADDRESS_TO_UUIDS_NODE, escapedAddress).mkString("/")
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
2011-04-29 15:47:56 +02:00
|
|
|
/** Path of the locations entry for the actor with the given UUID. */
private[cluster] def actorLocationsPathFor(uuid: UUID) =
  List[Any](ACTOR_LOCATIONS_NODE, uuid).mkString("/")
|
|
|
|
|
/** Path of the locations entry for the actor with the given UUID on the given node (by node name). */
private[cluster] def actorLocationsPathFor(uuid: UUID, node: NodeAddress) =
  List[Any](ACTOR_LOCATIONS_NODE, uuid, node.nodeName).mkString("/")
|
2011-04-27 01:10:00 +02:00
|
|
|
|
2011-04-29 15:47:56 +02:00
|
|
|
/** Path under which the actors in use on the node with the given name are listed. */
private[cluster] def actorsAtNodePathFor(node: String) =
  List[Any](ACTORS_AT_NODE_NODE, node).mkString("/")
|
|
|
|
|
/** Path of the entry for the actor with the given UUID in use on the node with the given name. */
private[cluster] def actorAtNodePathFor(node: String, uuid: UUID) =
  List[Any](ACTORS_AT_NODE_NODE, node, uuid).mkString("/")
|
2011-04-27 01:10:00 +02:00
|
|
|
|
2011-04-29 15:47:56 +02:00
|
|
|
/** Path of the registry entry for the actor with the given UUID. */
private[cluster] def actorRegistryPathFor(uuid: UUID) =
  List[Any](ACTOR_REGISTRY_NODE, uuid).mkString("/")
|
|
|
|
|
/** Path of the "format" child below the registry entry of the actor with the given UUID. */
private[cluster] def actorRegistryFormatPathFor(uuid: UUID) =
  List[Any](actorRegistryPathFor(uuid), "format").mkString("/")
|
|
|
|
|
/** Path of the "address" child below the registry entry of the actor with the given UUID. */
private[cluster] def actorRegistryActorAddressPathFor(uuid: UUID) =
  List[Any](actorRegistryPathFor(uuid), "address").mkString("/")
|
|
|
|
|
/** Path of the "node" child below the registry entry of the actor with the given UUID. */
private[cluster] def actorRegistryNodePathFor(uuid: UUID): String =
  List[Any](actorRegistryPathFor(uuid), "node").mkString("/")
|
|
|
|
|
/** Path of the "hostname:port" child below the "node" entry of the actor with the given UUID. */
private[cluster] def actorRegistryNodePathFor(uuid: UUID, address: InetSocketAddress): String = {
  val hostAndPort = address.getHostName + ":" + address.getPort
  actorRegistryNodePathFor(uuid) + "/" + hostAndPort
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Runs the start-up sequence of this cluster node: creates the root cluster node, joins the
 * leader election (the leader also creates the node structure if needed), registers listeners,
 * joins the membership and actors-at-node nodes and fetches the membership children.
 */
private[cluster] def initializeNode = {
  EventHandler.info(this, "Initializing cluster node [%s]".format(nodeAddress))
  createRootClusterNode
  // only the node that wins the election sets up the node structure
  if (joinLeaderElection) createNodeStructureIfNeeded
  registerListeners
  joinMembershipNode
  joinActorsAtAddressNode
  fetchMembershipChildrenNodes
  EventHandler.info(this, "Cluster node [%s] started successfully".format(nodeAddress))
}
|
|
|
|
|
|
|
|
|
|
/**
 * Reads the membership data of the given node and returns the socket address built from it.
 * The data is read as ':'-separated tokens: cluster name, node name, hostname, port.
 */
private[cluster] def addressForNode(node: String): InetSocketAddress = {
  val membershipData = zkClient.readData(membershipPathFor(node)).asInstanceOf[String]
  val fields = new java.util.StringTokenizer(membershipData, ":")
  fields.nextToken // skip cluster name
  fields.nextToken // skip node name
  val host = fields.nextToken
  val portNumber = fields.nextToken.toInt
  new InetSocketAddress(host, portNumber)
}
|
|
|
|
|
|
2011-04-29 15:47:56 +02:00
|
|
|
/** Returns the UUIDs registered under the actor address, with null entries dropped. */
private def actorUuidsForActorAddress(actorAddress: String): Array[UUID] = {
  val registered = uuidsForActorAddress(actorAddress)
  registered filterNot (_ eq null)
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/**
 * Returns a random set with replica connections of size 'replicationFactor'.
 * Default replicationFactor is 0, which returns the empty set.
 *
 * Throws IllegalArgumentException when fewer replica connections are available than requested.
 */
private def replicaConnectionsForReplicationFactor(replicationFactor: Int = 0): Set[ActorRef] =
  if (replicationFactor < 1) HashSet.empty[ActorRef]
  else {
    connectToAllReplicas

    val available = replicaConnections.size
    val daemons = replicaConnections.toList map { case (_, (_, daemon)) => daemon } // the ActorRefs

    if (available < replicationFactor) {
      throw new IllegalArgumentException(
        "Replication factor [" + replicationFactor + "] is greater than the number of available nodes [" + available + "]")
    } else if (available == replicationFactor) {
      HashSet.empty[ActorRef] ++ daemons
    } else {
      // keep drawing random connections until enough distinct ones have been collected
      val random = new java.util.Random(System.currentTimeMillis)
      var picked = HashSet.empty[ActorRef]
      while (picked.size < replicationFactor) {
        picked = picked + daemons(random.nextInt(available))
      }
      picked
    }
  }
|
|
|
|
|
|
|
|
|
|
/**
 * Connect to all available replicas (unless already connected): for every membership node
 * without an entry in 'replicaConnections', looks up the node's address and stores a remote
 * reference to its cluster daemon.
 */
private def connectToAllReplicas = {
  membershipNodes foreach { node =>
    val alreadyConnected = replicaConnections.contains(node)
    if (!alreadyConnected) {
      val daemonAddress = addressForNode(node)
      val daemonRef = Actor.remote.actorFor(
        RemoteClusterDaemon.ADDRESS, daemonAddress.getHostName, daemonAddress.getPort)
      replicaConnections.put(node, (daemonAddress, daemonRef))
    }
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Joins the cluster by recording this node's address under its node name and creating the
 * ephemeral membership node for it.
 *
 * Logs and throws a ClusterException when a membership node with this path already exists.
 */
private[cluster] def joinMembershipNode = {
  nodeNameToAddress.put(nodeAddress.nodeName, remoteServerAddress)
  try {
    EventHandler.info(this,
      "Joining cluster as membership node [%s] on [%s]".format(nodeAddress, membershipNodePath))
    zkClient.createEphemeral(membershipNodePath, nodeAddress.toString)
  } catch {
    case e: ZkNodeExistsException =>
      val error = new ClusterException("Can't join the cluster. The node name [" + nodeAddress.nodeName + "] is already in use by another node")
      EventHandler.error(error, this, "")
      throw error
  }
}
|
|
|
|
|
|
|
|
|
|
/** Creates the persistent actors-at-node entry for this node; an existing entry is left as is. */
private[cluster] def joinActorsAtAddressNode = {
  val actorsAtThisNodePath = actorsAtNodePathFor(nodeAddress.nodeName)
  ignore[ZkNodeExistsException](zkClient.createPersistent(actorsAtThisNodePath))
}
|
2011-04-27 01:10:00 +02:00
|
|
|
|
|
|
|
|
/** Logs that this node joins the leader election and returns the result of taking the leader lock. */
private[cluster] def joinLeaderElection: Boolean = {
  EventHandler.info(this,
    "Node [%s] is joining leader election".format(nodeAddress.nodeName))
  val lockResult = leaderLock.lock
  lockResult
}
|
|
|
|
|
|
|
|
|
|
/** Tells every cluster actor ref recorded for address 'from' to fail over from 'from' to 'to'. */
private[cluster] def failOverConnections(from: InetSocketAddress, to: InetSocketAddress) {
  for (clusterRef <- clusterActorRefs.values(from)) clusterRef.failOver(from, to)
}
|
|
|
|
|
|
|
|
|
|
/**
 * Takes over the actors of failed nodes.
 *
 * For every failed node found for 'currentSetOfClusterNodes', this node checks its position
 * against the failed node's position in the locally cached membership list. When it is the
 * node chosen to take over, it migrates and checks out every actor listed for the failed node
 * and then sends a FAIL_OVER_CONNECTIONS command to the membership nodes it has connections to.
 */
private[cluster] def migrateFromFailedNodes[T <: Actor](currentSetOfClusterNodes: List[String]) = {
  for (failedNodeName <- findFailedNodes(currentSetOfClusterNodes)) {

    val cachedNodes = locallyCachedMembershipNodes.toList
    val ownIndex = cachedNodes.indexWhere(_.endsWith(nodeAddress.nodeName))
    val failedIndex = cachedNodes.indexWhere(_ == failedNodeName)

    // Migrate to the successor of the failed node (using a sorted circular list of the node names)
    // No leftmost successor exists, check the tail
    val wrapsAroundToTail = failedIndex == 0 && ownIndex == locallyCachedMembershipNodes.size - 1
    // Am I the leftmost successor?
    val isLeftmostSuccessor = failedIndex == ownIndex + 1

    if (wrapsAroundToTail || isLeftmostSuccessor) {

      // Yes I am the node to migrate the actor to (can only be one in the cluster)
      val actorUuidsForFailedNode = zkClient.getChildren(actorsAtNodePathFor(failedNodeName))
      EventHandler.debug(this,
        "Migrating actors from failed node [%s] to node [%s]: Actor UUIDs [%s]"
          .format(failedNodeName, nodeAddress.nodeName, actorUuidsForFailedNode))

      for (uuid <- actorUuidsForFailedNode) {
        EventHandler.debug(this,
          "Cluster node [%s] has failed, migrating actor with UUID [%s] to [%s]"
            .format(failedNodeName, uuid, nodeAddress.nodeName))

        val actorAddress = actorAddressForUuid(uuidFrom(uuid))
        // since the ephemeral node is already gone, so can't check
        val failedNodeAddress = NodeAddress(nodeAddress.clusterName, failedNodeName)
        migrateWithoutCheckingThatActorResidesOnItsHomeNode(failedNodeAddress, nodeAddress, actorAddress)

        implicit val format: Format[T] = formatForActor(actorAddress)
        use(actorAddress) foreach { actor =>
          // FIXME remove ugly reflection when we have 1.0 final which has 'fromBinary(byte, homeAddress)(format)'
          //actor.homeAddress = remoteServerAddress
          val homeAddress = classOf[LocalActorRef].getDeclaredField("homeAddress")
          homeAddress.setAccessible(true)
          homeAddress.set(actor, Some(remoteServerAddress))

          remoteService.register(uuid, actor)
        }
      }

      // notify all available nodes that they should fail-over all connections from 'from' to 'to'
      val from = nodeNameToAddress.get(failedNodeName)
      val to = remoteServerAddress
      val failOverCommand = RemoteDaemonMessageProtocol.newBuilder
        .setMessageType(FAIL_OVER_CONNECTIONS)
        .setPayload(ByteString.copyFrom(Serializer.Java.toBinary((from, to))))
        .build
      for {
        node <- membershipNodes
        entry <- replicaConnections.get(node)
      } entry._2 ! failOverCommand
    }
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Used when the ephemeral "home" node is already gone, so we can't check.
 *
 * For every UUID registered for `actorAddress`, and unless the actor is already in use on
 * `to`: releases the actor locally, creates the registry/location/actors-at-node entries
 * for `to` in ZooKeeper (entries that already exist are left alone), deletes the
 * corresponding entries for `from` (missing entries are tolerated) and finally asks the
 * `to` node to check the actor out.
 *
 * @param from         node the actor is migrated away from
 * @param to           node the actor is migrated to
 * @param actorAddress address of the actor to migrate
 */
private def migrateWithoutCheckingThatActorResidesOnItsHomeNode(
  from: NodeAddress, to: NodeAddress, actorAddress: String) {

  // Executed purely for its side effects, hence 'foreach' rather than 'map'
  actorUuidsForActorAddress(actorAddress) foreach { uuid =>
    // Address as currently registered for this UUID (kept as a separate lookup, named so
    // that it no longer shadows the 'actorAddress' parameter)
    val registeredAddress = actorAddressForUuid(uuid)

    if (!isInUseOnNode(registeredAddress, to)) {
      release(registeredAddress)

      val newAddress = new InetSocketAddress(to.hostname, to.port)
      ignore[ZkNodeExistsException](zkClient.createPersistent(actorRegistryNodePathFor(uuid)))
      ignore[ZkNodeExistsException](zkClient.createEphemeral(actorRegistryNodePathFor(uuid, newAddress)))
      ignore[ZkNodeExistsException](zkClient.createEphemeral(actorLocationsPathFor(uuid, to)))
      // Register the actor under the *target* node, consistent with the other 'to' paths
      // above (identical to the local node when called for fail-over to this node)
      ignore[ZkNodeExistsException](zkClient.createPersistent(actorAtNodePathFor(to.nodeName, uuid)))

      ignore[ZkNoNodeException](zkClient.delete(actorLocationsPathFor(uuid, from)))
      ignore[ZkNoNodeException](zkClient.delete(actorAtNodePathFor(from.nodeName, uuid)))

      // 'use' (check out) actor on the remote 'to' node
      useActorOnNode(to.nodeName, uuid)
    }
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the node names that are in the local membership cache but not in `nodes`.
 */
private[cluster] def findFailedNodes(nodes: List[String]): List[String] = {
  val currentNodes = Set(nodes: _*)
  (locallyCachedMembershipNodes diff currentNodes).toList
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the node names in `nodes` that are not yet in the local membership cache.
 */
private[cluster] def findNewlyConnectedMembershipNodes(nodes: List[String]): List[String] = {
  val currentNodes = Set(nodes: _*)
  (currentNodes diff locallyCachedMembershipNodes).toList
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the node names that are in the local membership cache but no longer in `nodes`.
 */
private[cluster] def findNewlyDisconnectedMembershipNodes(nodes: List[String]): List[String] = {
  val currentNodes = Set(nodes: _*)
  (locallyCachedMembershipNodes diff currentNodes).toList
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the node names in `nodes` that are not in the local membership cache.
 * NOTE(review): compares against the *membership* cache, exactly like
 * `findNewlyConnectedMembershipNodes` - confirm that is intended for "available" nodes.
 */
private[cluster] def findNewlyConnectedAvailableNodes(nodes: List[String]): List[String] = {
  val currentNodes = Set(nodes: _*)
  (currentNodes diff locallyCachedMembershipNodes).toList
}
|
|
|
|
|
|
|
|
|
|
/**
 * Returns the node names that are in the local membership cache but not in `nodes`.
 * NOTE(review): compares against the *membership* cache, exactly like
 * `findNewlyDisconnectedMembershipNodes` - confirm that is intended for "available" nodes.
 */
private[cluster] def findNewlyDisconnectedAvailableNodes(nodes: List[String]): List[String] = {
  val currentNodes = Set(nodes: _*)
  (locallyCachedMembershipNodes diff currentNodes).toList
}
|
|
|
|
|
|
|
|
|
|
/**
 * Creates the persistent root node `CLUSTER_NODE` in ZooKeeper and logs its creation.
 * The body runs inside `ignore[ZkNodeExistsException]` (helper defined elsewhere), so an
 * already existing root node is presumably not treated as an error.
 */
private def createRootClusterNode: Unit = {
  ignore[ZkNodeExistsException] {
    zkClient.create(CLUSTER_NODE, null, CreateMode.PERSISTENT)
    EventHandler.info(this, "Created node [%s]".format(CLUSTER_NODE))
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Creates every path in `baseNodes` as a persistent ZooKeeper node.
 *
 * A path that already exists is skipped silently. Any other failure is logged together
 * with the offending path and rethrown as a `ClusterException` carrying the original
 * error's string representation.
 */
private def createNodeStructureIfNeeded = {
  baseNodes.foreach { path =>
    try {
      zkClient.create(path, null, CreateMode.PERSISTENT)
      EventHandler.debug(this, "Created node [%s]".format(path))
    } catch {
      case e: ZkNodeExistsException => {} // do nothing
      case e =>
        val error = new ClusterException(e.toString)
        // Say which node could not be created and why, instead of logging an empty message
        EventHandler.error(error, this, "Could not create node [%s]: %s".format(path, e.toString))
        throw error
    }
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Subscribes `stateListener` to ZooKeeper connection state changes and
 * `membershipListener` to child changes below `MEMBERSHIP_NODE`.
 */
private def registerListeners = {
  zkClient subscribeStateChanges stateListener
  zkClient.subscribeChildChanges(MEMBERSHIP_NODE, membershipListener)
}
|
|
|
|
|
|
|
|
|
|
/**
 * Replaces the content of the local membership cache with the current children of
 * `MEMBERSHIP_NODE` as read from ZooKeeper.
 */
private def fetchMembershipChildrenNodes = {
  val children = zkClient.getChildren(MEMBERSHIP_NODE)
  locallyCachedMembershipNodes.clear()
  for (child <- children.iterator) locallyCachedMembershipNodes.add(child)
}
|
|
|
|
|
|
|
|
|
|
/**
 * Builds a `ClusterNodeMBean` whose operations all delegate to this cluster node (`self`)
 * and registers it with JMX under `clusterJmxObjectName`.
 */
private def createMBean = {
  val mbean = new StandardMBean(classOf[ClusterNodeMBean]) with ClusterNodeMBean {
    import Cluster._

    // --- lifecycle ---
    def start = self.start
    def stop = self.stop

    def disconnect = self.disconnect
    def reconnect = self.reconnect
    def resign = self.resign

    def isConnected = self.isConnected.isOn

    // --- node identity ---
    def getRemoteServerHostname = self.nodeAddress.hostname
    def getRemoteServerPort = self.nodeAddress.port

    def getNodeName = self.nodeAddress.nodeName
    def getClusterName = self.nodeAddress.clusterName
    def getZooKeeperServerAddresses = self.zkServerAddresses

    // --- membership ---
    def getMemberNodes = self.locallyCachedMembershipNodes.iterator.map(_.toString).toArray
    def getLeader = self.leader.toString

    // --- actors ---
    def getUuidsForActorsInUse = self.uuidsForActorsInUse.map(_.toString).toArray
    def getAddressesForActorsInUse = self.addressesForActorsInUse.map(_.toString).toArray

    def getUuidsForClusteredActors = self.uuidsForClusteredActors.map(_.toString).toArray
    def getAddressesForClusteredActors = self.addressesForClusteredActors.map(_.toString).toArray

    def getNodesForActorInUseWithUuid(uuid: String) = self.nodesForActorsInUseWithUuid(stringToUuid(uuid))
    def getNodesForActorInUseWithAddress(id: String) = self.nodesForActorsInUseWithAddress(id)

    def getUuidsForActorsInUseOnNode(nodeName: String) = self.uuidsForActorsInUseOnNode(nodeName).map(_.toString).toArray
    def getAddressesForActorsInUseOnNode(nodeName: String) = self.addressesForActorsInUseOnNode(nodeName).map(_.toString).toArray

    // --- configuration (values are exchanged as UTF-8 encoded strings) ---
    def setConfigElement(key: String, value: String) = self.setConfigElement(key, value.getBytes("UTF-8"))
    def getConfigElement(key: String) = new String(self.getConfigElement(key), "UTF-8")
    def removeConfigElement(key: String) = self.removeConfigElement(key)
    def getConfigElementKeys = self.getConfigElementKeys.toArray
  }

  JMX.register(clusterJmxObjectName, mbean)

  // FIXME need monitoring to lookup the cluster MBean dynamically
  // Monitoring.registerLocalMBean(clusterJmxObjectName, mbean)
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
 * ZooKeeper child listener for the membership node. On every change it publishes
 * `NodeConnected` / `NodeDisconnected` events for the difference between the reported
 * children and the node's local membership cache, keeps the 'nodename-address' map in
 * sync, and then replaces the cache content with the reported children.
 *
 * @author <a href="http://jonasboner.com">Jonas Bonér</a>
 */
class MembershipChildListener(self: ClusterNode) extends IZkChildListener with ErrorHandler {
  def handleChildChange(parentPath: String, currentChilds: JList[String]) = withErrorHandler {
    // A null child list is ignored entirely
    Option(currentChilds) foreach { children =>
      val childList = children.toList
      if (childList.nonEmpty) {
        EventHandler.debug(this,
          "MembershipChildListener at [%s] has children [%s]"
            .format(self.nodeAddress.nodeName, childList.mkString(" ")))
      }

      for (name <- self.findNewlyConnectedMembershipNodes(childList)) {
        self.nodeNameToAddress.put(name, self.addressForNode(name)) // update 'nodename-address' map
        self.publish(Cluster.NodeConnected(name))
      }

      for (name <- self.findNewlyDisconnectedMembershipNodes(childList)) {
        self.nodeNameToAddress.remove(name) // update 'nodename-address' map
        self.publish(Cluster.NodeDisconnected(name))
      }

      // Refresh the cache only after both diffs above have been computed against the old content
      self.locallyCachedMembershipNodes.clear()
      for (child <- childList) self.locallyCachedMembershipNodes.add(child)
    }
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * ZooKeeper connection state listener that translates state changes into
 * `Cluster.ThisNode.*` events published by the owning cluster node.
 *
 * @author <a href="http://jonasboner.com">Jonas Bonér</a>
 */
class StateListener(self: ClusterNode) extends IZkStateListener {

  /**
   * Logs the new connection state and publishes the matching event. States without a
   * dedicated event are only logged, so they no longer escape as a `MatchError`.
   */
  def handleStateChanged(state: KeeperState) = state match {

    case KeeperState.SyncConnected =>
      EventHandler.debug(this, "Cluster node [%s] - Connected".format(self.nodeAddress))
      self.publish(Cluster.ThisNode.Connected)

    case KeeperState.Disconnected =>
      EventHandler.debug(this, "Cluster node [%s] - Disconnected".format(self.nodeAddress))
      self.publish(Cluster.ThisNode.Disconnected)

    case KeeperState.Expired =>
      EventHandler.debug(this, "Cluster node [%s] - Expired".format(self.nodeAddress))
      self.publish(Cluster.ThisNode.Expired)

    // KeeperState has more values than the three above; ignore them explicitly
    case other =>
      EventHandler.debug(this,
        "Cluster node [%s] - Ignoring unhandled ZooKeeper state [%s]".format(self.nodeAddress, other))
  }

  /**
   * Re-initialize after the zookeeper session has expired and a new session has been created.
   */
  def handleNewSession = {
    EventHandler.debug(this, "Session expired re-initializing node [%s]".format(self.nodeAddress))
    self.initializeNode
    self.publish(Cluster.NewSession)
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Mixin providing a wrapper that logs failures of a block of code before rethrowing them.
 *
 * @author <a href="http://jonasboner.com">Jonas Bonér</a>
 */
trait ErrorHandler {

  /**
   * Evaluates `body`. A `ZkInterruptedException` is swallowed; every other throwable is
   * reported through `EventHandler.error` and then rethrown unchanged.
   */
  def withErrorHandler[T](body: => T) =
    try body
    catch {
      case _: ZkInterruptedException => { /* ignore */ }
      case cause: Throwable =>
        EventHandler.error(cause, this, cause.toString)
        throw cause
    }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Constants and shared resources for the remote cluster daemon actor.
 *
 * @author <a href="http://jonasboner.com">Jonas Bonér</a>
 */
object RemoteClusterDaemon {

  /** Address string of the cluster daemon. */
  val ADDRESS = "akka-cluster-daemon"

  // FIXME configure functionServerDispatcher to what?
  /** Dispatcher assigned to the short-lived actors that execute remotely submitted functions. */
  val functionServerDispatcher = {
    val builder = Dispatchers.newExecutorBasedEventDrivenDispatcher("akka:cloud:cluster:function:server")
    builder.build
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Actor that executes `RemoteDaemonMessageProtocol` commands against the given cluster
 * node: checking actors out/in, node lifecycle operations, connection fail-over and
 * execution of functions shipped in the message payload.
 *
 * @author <a href="http://jonasboner.com">Jonas Bonér</a>
 */
class RemoteClusterDaemon(cluster: ClusterNode) extends Actor {
  import RemoteClusterDaemon._
  import Cluster._

  self.dispatcher = Dispatchers.newThreadBasedDispatcher(self)

  def receive: Receive = {
    case message: RemoteDaemonMessageProtocol =>
      EventHandler.debug(this, "Received command to RemoteClusterDaemon [%s]".format(message))
      message.getMessageType match {

        case USE =>
          if (message.hasActorUuid) {
            useActorWithAddress(cluster.actorAddressForUuid(uuidProtocolToUuid(message.getActorUuid)))
          } else if (message.hasActorAddress) {
            useActorWithAddress(message.getActorAddress)
          } else EventHandler.warning(this,
            "None of 'uuid', or 'address' is specified, ignoring remote cluster daemon command [%s]".format(message))

        case RELEASE =>
          if (message.hasActorUuid) { cluster release cluster.actorAddressForUuid(uuidProtocolToUuid(message.getActorUuid)) }
          else if (message.hasActorAddress) { cluster release message.getActorAddress }
          else EventHandler.warning(this,
            "None of 'uuid' or 'actorAddress'' is specified, ignoring remote cluster daemon command [%s]".format(message))

        case START => cluster.start

        case STOP => cluster.stop

        case DISCONNECT => cluster.disconnect

        case RECONNECT => cluster.reconnect

        case RESIGN => cluster.resign

        case FAIL_OVER_CONNECTIONS =>
          val (from, to) = payloadFor(message, classOf[(InetSocketAddress, InetSocketAddress)])
          cluster.failOverConnections(from, to)

        // Each FUNCTION_* command spawns a one-shot actor on 'functionServerDispatcher' that
        // runs the deserialized function and stops itself afterwards. The '*_UNIT' variants
        // fire and forget ('!'), the '*_ANY' variants reply with the result ('forward').
        case FUNCTION_FUN0_UNIT =>
          actorOf(new Actor() {
            self.dispatcher = functionServerDispatcher
            def receive = {
              case f: Function0[Unit] => try { f() } finally { self.stop }
            }
          }).start ! payloadFor(message, classOf[Function0[Unit]])

        case FUNCTION_FUN0_ANY =>
          actorOf(new Actor() {
            self.dispatcher = functionServerDispatcher
            def receive = {
              case f: Function0[Any] => try { self.reply(f()) } finally { self.stop }
            }
          }).start forward payloadFor(message, classOf[Function0[Any]])

        case FUNCTION_FUN1_ARG_UNIT =>
          actorOf(new Actor() {
            self.dispatcher = functionServerDispatcher
            def receive = {
              case t: Tuple2[Function1[Any, Unit], Any] => try { t._1(t._2) } finally { self.stop }
            }
          }).start ! payloadFor(message, classOf[Tuple2[Function1[Any, Unit], Any]])

        case FUNCTION_FUN1_ARG_ANY =>
          actorOf(new Actor() {
            self.dispatcher = functionServerDispatcher
            def receive = {
              case t: Tuple2[Function1[Any, Any], Any] => try { self.reply(t._1(t._2)) } finally { self.stop }
            }
          }).start forward payloadFor(message, classOf[Tuple2[Function1[Any, Any], Any]])

        // Any message type without a handler above is reported instead of raising a
        // MatchError inside the daemon
        case other =>
          EventHandler.warning(this,
            "Unhandled remote cluster daemon command type [%s], ignoring command [%s]".format(other, message))
      }

    case unknown => EventHandler.warning(this, "Unknown message [%s]".format(unknown))
  }

  /**
   * Checks out ('uses') the actor registered under `address` on this node, using the
   * serialization format the cluster has stored for that address.
   */
  private def useActorWithAddress(address: String) {
    implicit val format: Format[Actor] = cluster formatForActor address
    cluster use address
  }

  /**
   * Deserializes the payload of `message` with Java serialization and casts it to `T`.
   * NOTE(review): this deserializes (and for FUNCTION_* commands executes) data received
   * in a message - confirm that only trusted nodes can reach this daemon.
   */
  private def payloadFor[T](message: RemoteDaemonMessageProtocol, clazz: Class[T]): T = {
    Serializer.Java.fromBinary(message.getPayload.toByteArray, Some(clazz)).asInstanceOf[T]
  }
}
|