pekko/akka-distributed-data/src/main/scala/akka/cluster/ddata/ORSet.scala

/**
 * Copyright (C) 2009-2015 Typesafe Inc. <http://www.typesafe.com>
 */
package akka.cluster.ddata

import scala.annotation.tailrec
import scala.collection.immutable.TreeMap

import akka.cluster.Cluster
import akka.cluster.UniqueAddress
import akka.util.HashCode

// TODO this class can be optimized, but I wanted to start with correct functionality and comparability with riak_dt_orswot

object ORSet {
  // One shared empty instance. It holds no elements, so it can be handed out
  // under any element type.
  private val _empty: ORSet[Any] = new ORSet(Map.empty, VersionVector.empty)

  /**
   * The empty set, viewed as a set of `A`.
   */
  def empty[A]: ORSet[A] = _empty.asInstanceOf[ORSet[A]]

  /**
   * The empty set, typed as `ORSet[Any]`.
   */
  def apply(): ORSet[Any] = _empty

  /**
   * Java API: the empty set, viewed as a set of `A`.
   */
  def create[A](): ORSet[A] = empty[A]

  /**
   * Extractor exposing the [[ORSet#elements]] of the given set.
   */
  def unapply[A](s: ORSet[A]): Option[Set[A]] = Some(s.elements)

  /**
   * Extractor exposing the [[ORSet#elements]] when the given `ReplicatedData`
   * is an `ORSet`; does not match any other kind of data.
   */
  def unapply(a: ReplicatedData): Option[Set[Any]] = a match {
    case s: ORSet[Any] @unchecked ⇒ Some(s.elements)
    case _ ⇒ None
  }

  /**
   * INTERNAL API
   * The dots of an element are represented as a `VersionVector`.
   */
  private[akka] type Dot = VersionVector

  /**
   * INTERNAL API
   * Removes from `dot` every (node, version) pair that is already covered by
   * `vvector`, i.e. every pair for which `vvector` holds an entry for the same
   * node with a version that is greater than or equal to the one in `dot`.
   * Pairs for nodes that are unknown to `vvector` are retained.
   * Example [{a, 3}, {b, 2}, {d, 14}, {g, 22}] -
   *         [{a, 4}, {b, 1}, {c, 1}, {d, 14}, {e, 5}, {f, 2}] =
   *         [{b, 2}, {g, 22}]
   */
  private[akka] def subtractDots(dot: Dot, vvector: VersionVector): Dot =
    if (dot.versions.isEmpty)
      VersionVector.empty
    else {
      val seenVersions = vvector.versions
      val remaining = dot.versions.foldLeft(VersionVector.emptyVersions) { (kept, entry) ⇒
        val (node, version) = entry
        // a dot that the version vector has already seen is dropped
        if (seenVersions.get(node).exists(_ >= version)) kept
        else kept.updated(node, version)
      }
      new VersionVector(versions = remaining)
    }

  /**
   * INTERNAL API
   * Computes the merged dots of the elements that are present in both `lhs` and `rhs`.
   * For each such element the dots that both sides have in common are kept, together
   * with the dots that exist on one side only and are not yet covered by the version
   * vector of the other side. An element that ends up without any dots is left out
   * of the result.
   * @see [[ORSet#merge]]
   */
  private[akka] def mergeCommonKeys[A](commonKeys: Set[A], lhs: ORSet[A], rhs: ORSet[A]): Map[A, ORSet.Dot] =
    commonKeys.foldLeft(Map.empty[A, ORSet.Dot]) { (result, key) ⇒
      val leftDot = lhs.elementsMap(key)
      val leftVersions = leftDot.versions
      val rightVersions = rhs.elementsMap(key).versions
      val sameSingleDot =
        leftVersions.size == 1 && rightVersions.size == 1 && leftVersions.head == rightVersions.head

      if (sameSingleDot)
        // both sides hold exactly the same single dot, nothing to compute
        result.updated(key, leftDot)
      else {
        val sharedDots = leftVersions.filter {
          case (node, version) ⇒ rightVersions.get(node).exists(_ == version)
        }
        val sharedNodes = sharedDots.keys
        val leftOnly = leftVersions -- sharedNodes
        val rightOnly = rightVersions -- sharedNodes
        // one-sided dots survive only when the other side has not seen them yet
        val leftKept = subtractDots(new VersionVector(leftOnly), rhs.vvector)
        val rightKept = subtractDots(new VersionVector(rightOnly), lhs.vvector)
        val mergedDots = leftKept.merge(rightKept).merge(new VersionVector(versions = sharedDots))
        // an element that is present on both sides may still have to be dropped
        if (mergedDots.versions.isEmpty) result
        else result.updated(key, mergedDots)
      }
    }

  /**
   * INTERNAL API
   * Adds to `accumulator` the elements in `keys`, which exist on one side only
   * (their dots are looked up in `elementsMap`), unless the version vector of the
   * other side, `vvector`, is greater than or equal to the dots of the element.
   * The stored dots are reduced to those not yet covered by `vvector`.
   * @see [[ORSet#merge]]
   */
  private[akka] def mergeDisjointKeys[A](keys: Set[A], elementsMap: Map[A, ORSet.Dot], vvector: VersionVector,
                                         accumulator: Map[A, ORSet.Dot]): Map[A, ORSet.Dot] =
    keys.foldLeft(accumulator) { (result, key) ⇒
      val dots = elementsMap(key)
      val coveredByOtherSide = vvector > dots || vvector == dots
      if (coveredByOtherSide) result
      // store only the dots that the other side has not seen
      else result.updated(key, subtractDots(dots, vvector))
    }
}

/**
 * An 'Observed Remove Set' CRDT, also known as 'OR-Set'. Elements can be added
 * and removed any number of times, and an add wins over a concurrent remove.
 *
 * The implementation does not follow the paper
 * <a href="http://hal.upmc.fr/file/index/docid/555588/filename/techreport.pdf">A comprehensive study of Convergent and Commutative Replicated Data Types</a>.
 * Instead it uses the more space efficient approach, which doesn't accumulate garbage
 * for removed elements, described in the paper
 * <a href="https://hal.inria.fr/file/index/docid/738680/filename/RR-8083.pdf">An optimized conflict-free replicated set</a>
 * The implementation is inspired by the Riak DT <a href="https://github.com/basho/riak_dt/blob/develop/src/riak_dt_orswot.erl">
 * riak_dt_orswot</a>.
 *
 * The ORSet holds a version vector that is incremented whenever an element is added
 * to the set. The `node -&gt; count` pair of that increment is stored with the element
 * as its "birth dot". When the element is added again its "birth dot" is replaced by
 * the `node -&gt; count` version vector entry resulting from that add. Removing an
 * element simply drops it, there are no tombstones.
 *
 * An element that exists in replica A but not in replica B is ambiguous: either A added
 * it and B has not seen that yet, or B removed it and A has not seen that yet.
 * To decide, the `dot` of the present element is compared with the version vector of
 * the Set it is absent from. A dot that is not "seen" by that version vector means that
 * the other Set has yet to see the add, and the element is part of the merged Set.
 * A dot that is dominated by that version vector means that the other Set has already
 * removed the element, and the element is not part of the merged Set.
 *
 * This class is immutable, i.e. "modifying" methods return a new instance.
 */
@SerialVersionUID(1L)
final class ORSet[A] private[akka] (
  private[akka] val elementsMap: Map[A, ORSet.Dot],
  private[akka] val vvector: VersionVector)
  extends ReplicatedData with ReplicatedDataSerialization with RemovedNodePruning {

  type T = ORSet[A]

  /**
   * Scala API: the elements that are currently in the set.
   */
  def elements: Set[A] = elementsMap.keySet

  /**
   * Java API: the elements that are currently in the set.
   */
  def getElements(): java.util.Set[A] = {
    import scala.collection.JavaConverters._
    elements.asJava
  }

  /**
   * `true` if the given element is in the set.
   */
  def contains(a: A): Boolean = elementsMap.contains(a)

  /**
   * `true` if the set has no elements.
   */
  def isEmpty: Boolean = elementsMap.isEmpty

  /**
   * Number of elements in the set.
   */
  def size: Int = elementsMap.size

  /**
   * Adds an element to the set on behalf of the implicitly given cluster node.
   */
  def +(element: A)(implicit node: Cluster): ORSet[A] = add(node, element)

  /**
   * Adds an element to the set on behalf of the given cluster node.
   */
  def add(node: Cluster, element: A): ORSet[A] = add(node.selfUniqueAddress, element)

  /**
   * INTERNAL API
   * Increments the entry of `node` in the version vector and stores the resulting
   * `node -&gt; count` pair as the only dot of the element.
   */
  private[akka] def add(node: UniqueAddress, element: A): ORSet[A] = {
    val bumpedVvector = vvector + node
    val birthDot = new VersionVector(versions = TreeMap(node -> bumpedVvector.versions(node)))
    copy(elementsMap = elementsMap.updated(element, birthDot), vvector = bumpedVvector)
  }

  /**
   * Removes an element from the set on behalf of the implicitly given cluster node.
   */
  def -(element: A)(implicit node: Cluster): ORSet[A] = remove(node, element)

  /**
   * Removes an element from the set on behalf of the given cluster node.
   */
  def remove(node: Cluster, element: A): ORSet[A] = remove(node.selfUniqueAddress, element)

  /**
   * INTERNAL API
   * Drops the element; the version vector is left as is.
   */
  private[akka] def remove(node: UniqueAddress, element: A): ORSet[A] =
    copy(elementsMap = elementsMap - element)

  /**
   * Removes all elements from the set, but keeps the history.
   * The result is the same as using [[#remove]] for each
   * element, but it is more efficient.
   */
  def clear(node: Cluster): ORSet[A] = clear(node.selfUniqueAddress)

  /**
   * INTERNAL API
   * Drops all elements; the version vector is left as is.
   */
  private[akka] def clear(node: UniqueAddress): ORSet[A] = copy(elementsMap = Map.empty)

  /**
   * Element that is in this Set but not in that Set (and vice versa):
   * The "birth dot" of the present element is compared with the version vector of the Set
   * it is absent from. If the dot is not "seen" by the version vector of the other Set,
   * the other Set has yet to see this add, and the element is to be in the merged Set.
   * If the version vector of the other Set dominates the dot, the other Set has removed
   * the element already, and the element is not to be in the merged Set.
   *
   * Element that is in both this Set and that Set:
   * Some dots may still need to be shed. Dots that this Set has and the other Set does not have
   * are dropped when the version vector of the other Set dominates them.
   * What is kept is the common dots, and the dots that are not dominated by the version vector
   * of the other side.
   */
  override def merge(that: ORSet[A]): ORSet[A] = {
    val ownKeys = elementsMap.keySet
    val otherKeys = that.elementsMap.keySet
    val sharedKeys = ownKeys.intersect(otherKeys)

    // start with the elements known to both sides, then add the one-sided elements
    val fromShared = ORSet.mergeCommonKeys(sharedKeys, this, that)
    val withOwn = ORSet.mergeDisjointKeys(ownKeys -- sharedKeys, this.elementsMap, that.vvector, fromShared)
    val mergedElements = ORSet.mergeDisjointKeys(otherKeys -- sharedKeys, that.elementsMap, this.vvector, withOwn)

    new ORSet(mergedElements, this.vvector.merge(that.vvector))
  }

  override def needPruningFrom(removedNode: UniqueAddress): Boolean =
    vvector.needPruningFrom(removedNode)

  override def prune(removedNode: UniqueAddress, collapseInto: UniqueAddress): ORSet[A] = {
    // elements whose dots refer to the removed node, with those dots pruned
    val pruned = elementsMap.foldLeft(Map.empty[A, ORSet.Dot]) { (acc, entry) ⇒
      val (elem, dot) = entry
      if (dot.needPruningFrom(removedNode)) acc.updated(elem, dot.prune(removedNode, collapseInto))
      else acc
    }
    val prunedVvector = vvector.prune(removedNode, collapseInto)

    if (pruned.isEmpty)
      copy(vvector = prunedVvector)
    else {
      // re-add elements that were pruned, to bump dots to right vvector
      val base = new ORSet(elementsMap = elementsMap ++ pruned, vvector = prunedVvector)
      pruned.keys.foldLeft(base)((set, elem) ⇒ set.add(collapseInto, elem))
    }
  }

  override def pruningCleanup(removedNode: UniqueAddress): ORSet[A] = {
    // replace the dots that still refer to the removed node with their cleaned up version
    val cleaned = elementsMap.foldLeft(elementsMap) { (acc, entry) ⇒
      val (elem, dot) = entry
      if (dot.needPruningFrom(removedNode)) acc.updated(elem, dot.pruningCleanup(removedNode))
      else acc
    }
    new ORSet(cleaned, vvector.pruningCleanup(removedNode))
  }

  private def copy(elementsMap: Map[A, ORSet.Dot] = this.elementsMap, vvector: VersionVector = this.vvector): ORSet[A] =
    new ORSet(elementsMap, vvector)

  // this class cannot be a `case class` because we need different `unapply`

  override def toString: String = s"OR$elements"

  override def equals(o: Any): Boolean = o match {
    case other: ORSet[_] ⇒ vvector == other.vvector && elementsMap == other.elementsMap
    case _ ⇒ false
  }

  override def hashCode: Int =
    HashCode.hash(HashCode.hash(HashCode.SEED, elementsMap), vvector)
}

object ORSetKey {
  /**
   * Creates the key of an [[ORSet]] with the given `id`, returned as the general `Key` type.
   */
  def create[A](id: String): Key[ORSet[A]] = new ORSetKey[A](id)
}

/**
 * Key of an [[ORSet]] holding elements of type `A`. The given `_id` is passed on
 * to the `Key` base class.
 */
@SerialVersionUID(1L)
final case class ORSetKey[A](_id: String) extends Key[ORSet[A]](_id) with ReplicatedDataSerialization
+cdd #16799 Add Distributed Data module Previously known as [patriknw/akka-data-replication](https://github.com/patriknw/akka-data-replication), which was originally inspired by [jboner/akka-crdt](https://github.com/jboner/akka-crdt). The functionality is very similar to akka-data-replication 0.11. Here is a list of the most important changes: * The package name changed to `akka.cluster.ddata` * The extension was renamed to `DistributedData` * The keys changed from strings to classes with unique identifiers and type information of the data values, e.g. `ORSetKey[Int]("set2")` * The optional read consistency parameter was removed from the `Update` message. If you need to read from other replicas before performing the update you have to first send a `Get` message and then continue with the ``Update`` when the ``GetSuccess`` is received. * `BigInt` is used in `GCounter` and `PNCounter` instead of `Long` * Improvements of java api * Better documentation 2015-05-17 12:28:47 +02:00			`/**`
			`* Copyright (C) 2009-2015 Typesafe Inc. <http://www.typesafe.com>`
			`*/`
			`package akka.cluster.ddata`

			`import scala.annotation.tailrec`
			`import scala.collection.immutable.TreeMap`

			`import akka.cluster.Cluster`
			`import akka.cluster.UniqueAddress`
			`import akka.util.HashCode`

			`// TODO this class can be optimized, but I wanted to start with correct functionality and comparability with riak_dt_orswot`

			`object ORSet {`
			`private val _empty: ORSet[Any] = new ORSet(Map.empty, VersionVector.empty)`
			`def empty[A]: ORSet[A] = _empty.asInstanceOf[ORSet[A]]`
			`def apply(): ORSet[Any] = _empty`
			`/**`
			`* Java API`
			`*/`
			`def create[A](): ORSet[A] = empty[A]`

			`/**`
			`* Extract the [[ORSet#elements]].`
			`*/`
			`def unapply[A](s: ORSet[A]): Option[Set[A]] = Some(s.elements)`

			`/**`
			* Extract the [[ORSet#elements]] of an `ORSet`.
			`*/`
			`def unapply(a: ReplicatedData): Option[Set[Any]] = a match {`
			`case s: ORSet[Any] @unchecked ⇒ Some(s.elements)`
			`case _ ⇒ None`
			`}`

			`/**`
			`* INTERNAL API`
			`*/`
			`private[akka]type Dot = VersionVector`

			`/**`
			`* INTERNAL API`
			* Subtract the `vvector` from the `dot`.
			`* What this means is that any (node, version) pair in`
			* `dot` that is <= an entry in `vvector` is removed from `dot`.
			`* Example [{a, 3}, {b, 2}, {d, 14}, {g, 22}] -`
			`* [{a, 4}, {b, 1}, {c, 1}, {d, 14}, {e, 5}, {f, 2}] =`
			`* [{b, 2}, {g, 22}]`
			`*/`
			`private[akka] def subtractDots(dot: Dot, vvector: VersionVector): Dot = {`

			`@tailrec def dropDots(remaining: List[(UniqueAddress, Long)], acc: List[(UniqueAddress, Long)]): List[(UniqueAddress, Long)] =`
			`remaining match {`
			`case Nil ⇒ acc`
			`case (d @ (node, v1)) :: rest ⇒`
			`vvector.versions.get(node) match {`
			`case Some(v2) if v2 >= v1 ⇒`
			`// dot is dominated by version vector, drop it`
			`dropDots(rest, acc)`
			`case _ ⇒`
			`dropDots(rest, d :: acc)`
			`}`
			`}`

=cdd #18328 optimize ORSet.mergeCommonKeys AFTER: [info] Benchmark (set1Size) Mode Cnt Score Error Units [info] ORSetMergeBenchmark.mergeAddFromBothNodes 1 thrpt 10 737.646 ± 10.289 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 10 thrpt 10 146.706 ± 6.331 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 20 thrpt 10 95.553 ± 1.801 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 100 thrpt 10 18.321 ± 0.586 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 1 thrpt 10 1274.526 ± 23.732 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 10 thrpt 10 162.426 ± 20.490 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 20 thrpt 10 102.436 ± 2.435 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 100 thrpt 10 18.911 ± 0.659 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 1 thrpt 10 653.358 ± 71.232 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 10 thrpt 10 147.385 ± 2.750 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 20 thrpt 10 94.280 ± 0.894 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 100 thrpt 10 17.922 ± 1.522 ops/ms [info] ORSetMergeBenchmark.mergeComplex 1 thrpt 10 335.060 ± 8.385 ops/ms [info] ORSetMergeBenchmark.mergeComplex 10 thrpt 10 134.438 ± 3.044 ops/ms [info] ORSetMergeBenchmark.mergeComplex 20 thrpt 10 86.015 ± 2.145 ops/ms [info] ORSetMergeBenchmark.mergeComplex 100 thrpt 10 17.611 ± 0.136 ops/ms BEFORE: [info] Benchmark (set1Size) Mode Cnt Score Error Units [info] ORSetMergeBenchmark.mergeAddFromBothNodes 1 thrpt 10 492.291 ± 55.903 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 10 thrpt 10 79.890 ± 4.977 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 20 thrpt 10 44.560 ± 9.081 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 100 thrpt 10 9.405 ± 0.323 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 1 thrpt 10 714.043 ± 14.694 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 10 thrpt 10 88.281 ± 13.858 ops/ms [info] 
ORSetMergeBenchmark.mergeAddFromOtherNode 20 thrpt 10 49.001 ± 0.940 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 100 thrpt 10 9.379 ± 0.300 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 1 thrpt 10 487.261 ± 7.457 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 10 thrpt 10 80.073 ± 9.736 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 20 thrpt 10 46.385 ± 1.225 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 100 thrpt 10 9.583 ± 0.234 ops/ms [info] ORSetMergeBenchmark.mergeComplex 1 thrpt 10 313.959 ± 31.419 ops/ms [info] ORSetMergeBenchmark.mergeComplex 10 thrpt 10 79.265 ± 1.126 ops/ms [info] ORSetMergeBenchmark.mergeComplex 20 thrpt 10 44.478 ± 2.077 ops/ms [info] ORSetMergeBenchmark.mergeComplex 100 thrpt 10 9.202 ± 0.564 ops/ms 2015-09-19 21:46:01 +02:00			`if (dot.versions.isEmpty)`
			`VersionVector.empty`
			`else {`
			`val newDots = dropDots(dot.versions.toList, Nil)`
			`new VersionVector(versions = VersionVector.emptyVersions ++ newDots)`
			`}`
+cdd #16799 Add Distributed Data module Previously known as [patriknw/akka-data-replication](https://github.com/patriknw/akka-data-replication), which was originally inspired by [jboner/akka-crdt](https://github.com/jboner/akka-crdt). The functionality is very similar to akka-data-replication 0.11. Here is a list of the most important changes: * The package name changed to `akka.cluster.ddata` * The extension was renamed to `DistributedData` * The keys changed from strings to classes with unique identifiers and type information of the data values, e.g. `ORSetKey[Int]("set2")` * The optional read consistency parameter was removed from the `Update` message. If you need to read from other replicas before performing the update you have to first send a `Get` message and then continue with the ``Update`` when the ``GetSuccess`` is received. * `BigInt` is used in `GCounter` and `PNCounter` instead of `Long` * Improvements of java api * Better documentation 2015-05-17 12:28:47 +02:00			`}`

			`/**`
			`* INTERNAL API`
			`* @see [[ORSet#merge]]`
			`*/`
			`private[akka] def mergeCommonKeys[A](commonKeys: Set[A], lhs: ORSet[A], rhs: ORSet[A]): Map[A, ORSet.Dot] = {`
			`commonKeys.foldLeft(Map.empty[A, ORSet.Dot]) {`
			`case (acc, k) ⇒`
=cdd #18328 optimize ORSet.mergeCommonKeys AFTER: [info] Benchmark (set1Size) Mode Cnt Score Error Units [info] ORSetMergeBenchmark.mergeAddFromBothNodes 1 thrpt 10 737.646 ± 10.289 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 10 thrpt 10 146.706 ± 6.331 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 20 thrpt 10 95.553 ± 1.801 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 100 thrpt 10 18.321 ± 0.586 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 1 thrpt 10 1274.526 ± 23.732 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 10 thrpt 10 162.426 ± 20.490 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 20 thrpt 10 102.436 ± 2.435 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 100 thrpt 10 18.911 ± 0.659 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 1 thrpt 10 653.358 ± 71.232 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 10 thrpt 10 147.385 ± 2.750 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 20 thrpt 10 94.280 ± 0.894 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 100 thrpt 10 17.922 ± 1.522 ops/ms [info] ORSetMergeBenchmark.mergeComplex 1 thrpt 10 335.060 ± 8.385 ops/ms [info] ORSetMergeBenchmark.mergeComplex 10 thrpt 10 134.438 ± 3.044 ops/ms [info] ORSetMergeBenchmark.mergeComplex 20 thrpt 10 86.015 ± 2.145 ops/ms [info] ORSetMergeBenchmark.mergeComplex 100 thrpt 10 17.611 ± 0.136 ops/ms BEFORE: [info] Benchmark (set1Size) Mode Cnt Score Error Units [info] ORSetMergeBenchmark.mergeAddFromBothNodes 1 thrpt 10 492.291 ± 55.903 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 10 thrpt 10 79.890 ± 4.977 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 20 thrpt 10 44.560 ± 9.081 ops/ms [info] ORSetMergeBenchmark.mergeAddFromBothNodes 100 thrpt 10 9.405 ± 0.323 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 1 thrpt 10 714.043 ± 14.694 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 10 thrpt 10 88.281 ± 13.858 ops/ms [info] 
ORSetMergeBenchmark.mergeAddFromOtherNode 20 thrpt 10 49.001 ± 0.940 ops/ms [info] ORSetMergeBenchmark.mergeAddFromOtherNode 100 thrpt 10 9.379 ± 0.300 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 1 thrpt 10 487.261 ± 7.457 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 10 thrpt 10 80.073 ± 9.736 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 20 thrpt 10 46.385 ± 1.225 ops/ms [info] ORSetMergeBenchmark.mergeAddFromSameNode 100 thrpt 10 9.583 ± 0.234 ops/ms [info] ORSetMergeBenchmark.mergeComplex 1 thrpt 10 313.959 ± 31.419 ops/ms [info] ORSetMergeBenchmark.mergeComplex 10 thrpt 10 79.265 ± 1.126 ops/ms [info] ORSetMergeBenchmark.mergeComplex 20 thrpt 10 44.478 ± 2.077 ops/ms [info] ORSetMergeBenchmark.mergeComplex 100 thrpt 10 9.202 ± 0.564 ops/ms 2015-09-19 21:46:01 +02:00			`val lhsDots = lhs.elementsMap(k)`
			`val lhsDotsVersions = lhsDots.versions`
			`val rhsDotsVersions = rhs.elementsMap(k).versions`
			`if (lhsDotsVersions.size == 1 && rhsDotsVersions.size == 1 && lhsDotsVersions.head == rhsDotsVersions.head) {`
			`// one single common dot`
			`acc.updated(k, lhsDots)`
			`} else {`
			`val commonDots = lhsDotsVersions.filter {`
			`case (thisDotNode, v) ⇒ rhsDotsVersions.get(thisDotNode).exists(_ == v)`
			`}`
			`val commonDotsKeys = commonDots.keys`
			`val lhsUniqueDots = lhsDotsVersions -- commonDotsKeys`
			`val rhsUniqueDots = rhsDotsVersions -- commonDotsKeys`
			`val lhsKeep = ORSet.subtractDots(new VersionVector(lhsUniqueDots), rhs.vvector)`
			`val rhsKeep = ORSet.subtractDots(new VersionVector(rhsUniqueDots), lhs.vvector)`
			`val merged = lhsKeep.merge(rhsKeep).merge(new VersionVector(versions = commonDots))`
			`// Perfectly possible that an item in both sets should be dropped`
			`if (merged.versions.isEmpty) acc`
			`else acc.updated(k, merged)`
+cdd #16799 Add Distributed Data module Previously known as [patriknw/akka-data-replication](https://github.com/patriknw/akka-data-replication), which was originally inspired by [jboner/akka-crdt](https://github.com/jboner/akka-crdt). The functionality is very similar to akka-data-replication 0.11. Here is a list of the most important changes: * The package name changed to `akka.cluster.ddata` * The extension was renamed to `DistributedData` * The keys changed from strings to classes with unique identifiers and type information of the data values, e.g. `ORSetKey[Int]("set2")` * The optional read consistency parameter was removed from the `Update` message. If you need to read from other replicas before performing the update you have to first send a `Get` message and then continue with the ``Update`` when the ``GetSuccess`` is received. * `BigInt` is used in `GCounter` and `PNCounter` instead of `Long` * Improvements of java api * Better documentation 2015-05-17 12:28:47 +02:00			`}`
			`}`
			`}`

			`/**`
			`* INTERNAL API`
			`* @see [[ORSet#merge]]`
			`*/`
			`private[akka] def mergeDisjointKeys[A](keys: Set[A], elementsMap: Map[A, ORSet.Dot], vvector: VersionVector,`
			`accumulator: Map[A, ORSet.Dot]): Map[A, ORSet.Dot] = {`
			`keys.foldLeft(accumulator) {`
			`case (acc, k) ⇒`
			`val dots = elementsMap(k)`
			`if (vvector > dots || vvector == dots)`
			`acc`
			`else {`
			`// Optimise the set of stored dots to include only those unseen`
			`val newDots = subtractDots(dots, vvector)`
			`acc.updated(k, newDots)`
			`}`
			`}`
			`}`
			`}`

			`/**`
			`* Implements a 'Observed Remove Set' CRDT, also called a 'OR-Set'.`
			`* Elements can be added and removed any number of times. Concurrent add wins`
			`* over remove.`
			`*`
			`* It is not implemented as in the paper`
			`* <a href="http://hal.upmc.fr/file/index/docid/555588/filename/techreport.pdf">A comprehensive study of Convergent and Commutative Replicated Data Types</a>.`
			`* This is more space efficient and doesn't accumulate garbage for removed elements.`
			`* It is described in the paper`
			`* <a href="https://hal.inria.fr/file/index/docid/738680/filename/RR-8083.pdf">An optimized conflict-free replicated set</a>`
			`* The implementation is inspired by the Riak DT <a href="https://github.com/basho/riak_dt/blob/develop/src/riak_dt_orswot.erl">`
			`* riak_dt_orswot</a>.`
			`*`
			`* The ORSet has a version vector that is incremented when an element is added to`
			* the set. The `node -> count` pair for that increment is stored against the
			`* element as its "birth dot". Every time the element is re-added to the set,`
			* its "birth dot" is updated to that of the `node -> count` version vector entry
			`* resulting from the add. When an element is removed, we simply drop it, no tombstones.`
			`*`
			`* When an element exists in replica A and not replica B, is it because A added`
			`* it and B has not yet seen that, or that B removed it and A has not yet seen that?`
			* In this implementation we compare the `dot` of the present element to the version vector
			`* in the Set it is absent from. If the element dot is not "seen" by the Set version vector,`
			`* that means the other set has yet to see this add, and the item is in the merged`
			`* Set. If the Set version vector dominates the dot, that means the other Set has removed this`
			`* element already, and the item is not in the merged Set.`
			`*`
			`* This class is immutable, i.e. "modifying" methods return a new instance.`
			`*/`
			`@SerialVersionUID(1L)`
			`final class ORSet[A] private[akka] (`
			`private[akka] val elementsMap: Map[A, ORSet.Dot],`
			`private[akka] val vvector: VersionVector)`
			`extends ReplicatedData with ReplicatedDataSerialization with RemovedNodePruning {`

			`type T = ORSet[A]`

			`/**`
			`* Scala API`
			`*/`
			`def elements: Set[A] = elementsMap.keySet`

			`/**`
			`* Java API`
			`*/`
			`def getElements(): java.util.Set[A] = {`
			`import scala.collection.JavaConverters._`
			`elements.asJava`
			`}`

			`def contains(a: A): Boolean = elementsMap.contains(a)`

			`def isEmpty: Boolean = elementsMap.isEmpty`

			`def size: Int = elementsMap.size`

			`/**`
			`* Adds an element to the set`
			`*/`
			`def +(element: A)(implicit node: Cluster): ORSet[A] = add(node, element)`

			`/**`
			`* Adds an element to the set`
			`*/`
			`def add(node: Cluster, element: A): ORSet[A] = add(node.selfUniqueAddress, element)`

			`/**`
			`* INTERNAL API`
			`*/`
			`private[akka] def add(node: UniqueAddress, element: A): ORSet[A] = {`
			`val newVvector = vvector + node`
			`val newDot = new VersionVector(versions = TreeMap(node -> newVvector.versions(node)))`
			`new ORSet(elementsMap = elementsMap.updated(element, newDot), vvector = newVvector)`
			`}`

			`/**`
			`* Removes an element from the set.`
			`*/`
			`def -(element: A)(implicit node: Cluster): ORSet[A] = remove(node, element)`

			`/**`
			`* Removes an element from the set.`
			`*/`
			`def remove(node: Cluster, element: A): ORSet[A] = remove(node.selfUniqueAddress, element)`

			`/**`
			`* INTERNAL API`
			`*/`
			`private[akka] def remove(node: UniqueAddress, element: A): ORSet[A] =`
			`copy(elementsMap = elementsMap - element)`

			`/**`
			`* Removes all elements from the set, but keeps the history.`
			`* This has the same result as using [[#remove]] for each`
			`* element, but it is more efficient.`
			`*/`
			`def clear(node: Cluster): ORSet[A] = clear(node.selfUniqueAddress)`

			`/**`
			`* INTERNAL API`
			`*/`
			`private[akka] def clear(node: UniqueAddress): ORSet[A] = copy(elementsMap = Map.empty)`

			`/**`
			`* When element is in this Set but not in that Set:`
			`* Compare the "birth dot" of the present element to the version vector in the Set it is absent from.`
			`* If the element dot is not "seen" by other Set version vector, that means the other set has yet to`
			`* see this add, and the element is to be in the merged Set.`
			`* If the other Set version vector dominates the dot, that means the other Set has removed`
			`* the element already, and the element is not to be in the merged Set.`
			`*`
			`* When element in both this Set and in that Set:`
			`* Some dots may still need to be shed. If this Set has dots that the other Set does not have,`
			`* and the other Set version vector dominates those dots, then we need to drop those dots.`
			`* Keep only common dots, and dots that are not dominated by the other sides version vector`
			`*/`
			`override def merge(that: ORSet[A]): ORSet[A] = {`
			`val thisKeys = elementsMap.keySet`
			`val thatKeys = that.elementsMap.keySet`
			`val commonKeys = thisKeys.intersect(thatKeys)`
			`val thisUniqueKeys = thisKeys -- commonKeys`
			`val thatUniqueKeys = thatKeys -- commonKeys`

			`val entries00 = ORSet.mergeCommonKeys(commonKeys, this, that)`
			`val entries0 = ORSet.mergeDisjointKeys(thisUniqueKeys, this.elementsMap, that.vvector, entries00)`
			`val entries = ORSet.mergeDisjointKeys(thatUniqueKeys, that.elementsMap, this.vvector, entries0)`
			`val mergedVvector = this.vvector.merge(that.vvector)`

			`new ORSet(entries, mergedVvector)`
			`}`

			`override def needPruningFrom(removedNode: UniqueAddress): Boolean =`
			`vvector.needPruningFrom(removedNode)`

			`override def prune(removedNode: UniqueAddress, collapseInto: UniqueAddress): ORSet[A] = {`
			`val pruned = elementsMap.foldLeft(Map.empty[A, ORSet.Dot]) {`
			`case (acc, (elem, dot)) ⇒`
			`if (dot.needPruningFrom(removedNode)) acc.updated(elem, dot.prune(removedNode, collapseInto))`
			`else acc`
			`}`
			`if (pruned.isEmpty)`
			`copy(vvector = vvector.prune(removedNode, collapseInto))`
			`else {`
			`// re-add elements that were pruned, to bump dots to right vvector`
			`val newSet = new ORSet(elementsMap = elementsMap ++ pruned, vvector = vvector.prune(removedNode, collapseInto))`
			`pruned.keys.foldLeft(newSet) {`
			`case (s, elem) ⇒ s.add(collapseInto, elem)`
			`}`
			`}`
			`}`

			`override def pruningCleanup(removedNode: UniqueAddress): ORSet[A] = {`
			`val updated = elementsMap.foldLeft(elementsMap) {`
			`case (acc, (elem, dot)) ⇒`
			`if (dot.needPruningFrom(removedNode)) acc.updated(elem, dot.pruningCleanup(removedNode))`
			`else acc`
			`}`
			`new ORSet(updated, vvector.pruningCleanup(removedNode))`
			`}`

			`private def copy(elementsMap: Map[A, ORSet.Dot] = this.elementsMap, vvector: VersionVector = this.vvector): ORSet[A] =`
			`new ORSet(elementsMap, vvector)`

			// this class cannot be a `case class` because we need different `unapply`

			`override def toString: String = s"OR$elements"`

			`override def equals(o: Any): Boolean = o match {`
			`case other: ORSet[_] ⇒ vvector == other.vvector && elementsMap == other.elementsMap`
			`case _ ⇒ false`
			`}`

			`override def hashCode: Int = {`
			`var result = HashCode.SEED`
			`result = HashCode.hash(result, elementsMap)`
			`result = HashCode.hash(result, vvector)`
			`result`
			`}`
			`}`

			`object ORSetKey {`
			`def create[A](id: String): Key[ORSet[A]] = ORSetKey(id)`
			`}`

			`@SerialVersionUID(1L)`
			`final case class ORSetKey[A](_id: String) extends Key[ORSet[A]](_id) with ReplicatedDataSerialization`