Added a correct consistent hash load balancer with test cases.
  - The approach is to have one routing ring per partition.
  - Rather than performing N (no. of partitions) lookups per routing request,
    it collapses the N rings into one by building a unique set of points on a single ring,
    where each point stores the node choice for every partition, obtained by looking up
    each partition's individual routing ring.
Terence Yim committed Feb 29, 2012
1 parent f256da3 commit 2ca216e
Showing 3 changed files with 446 additions and 0 deletions.
ConsistentHashLoadBalancer.java
@@ -0,0 +1,134 @@
package com.senseidb.cluster.routing;

import com.linkedin.norbert.javacompat.cluster.Node;
import java.util.ArrayList;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.NavigableMap;
import java.util.Set;
import java.util.TreeMap;
import org.apache.log4j.Logger;


/**
 * A {@link SenseiLoadBalancer} that provides consistent hash behavior for all partitions with one lookup per routing.
 */
public class ConsistentHashLoadBalancer implements SenseiLoadBalancer
{
  private static Logger logger = Logger.getLogger(ConsistentHashLoadBalancer.class);

  private final HashProvider _hashProvider;
  private final NavigableMap<Long, RoutingInfo> _routingMap;

  public ConsistentHashLoadBalancer(HashProvider hashProvider, int bucketCount, Set<Node> nodes)
  {
    _hashProvider = hashProvider;
    _routingMap = new TreeMap<Long, RoutingInfo>();

    // Gather the set of nodes for each partition
    Map<Integer, Set<Node>> partitionNodes = new TreeMap<Integer, Set<Node>>();
    for (Node node : nodes)
    {
      for (Integer partId : node.getPartitionIds())
      {
        Set<Node> partNodes = partitionNodes.get(partId);
        if (partNodes == null)
        {
          partNodes = new HashSet<Node>();
          partitionNodes.put(partId, partNodes);
        }
        partNodes.add(node);
      }
    }

    // Build the common data structure shared among all RoutingInfo
    int maxSize = 0;
    int[] partitions = new int[partitionNodes.size()];
    @SuppressWarnings("unchecked")
    List<Node>[] nodeLists = new List[partitions.length];
    int idx = 0;
    for (Map.Entry<Integer, Set<Node>> entry : partitionNodes.entrySet())
    {
      partitions[idx] = entry.getKey();
      nodeLists[idx] = new ArrayList<Node>(entry.getValue());
      if (maxSize < nodeLists[idx].size()) {
        maxSize = nodeLists[idx].size();
      }
      idx++;
    }

    // Build an individual ring for each partition
    Map<Integer, NavigableMap<Long, Integer>> rings = new TreeMap<Integer, NavigableMap<Long, Integer>>();
    for (int i = 0; i < partitions.length; i++)
    {
      Integer partId = partitions[i];
      NavigableMap<Long, Integer> ring = rings.get(partId);
      if (ring == null)
      {
        ring = new TreeMap<Long, Integer>();
        rings.put(partId, ring);
      }

      // Put points in the ring: bucketCount points per node.
      for (int j = 0; j < nodeLists[i].size(); j++)
      {
        for (int k = 0; k < bucketCount; k++)
        {
          ring.put(hashProvider.hash(String.format("node-%d-%d", nodeLists[i].get(j).getId(), k)), j);
        }
      }
    }

    // Generate points and gather the node choice for each partition at each point
    for (int slot = 0; slot < bucketCount * maxSize; slot++)
    {
      Long point = hashProvider.hash(String.format("ring-%d", slot));

      // Choice of node for each partition
      int[] nodeChoices = new int[partitions.length];
      for (int i = 0; i < partitions.length; i++)
      {
        nodeChoices[i] = lookup(rings.get(partitions[i]), point);
      }

      _routingMap.put(point, new RoutingInfo(nodeLists, partitions, nodeChoices));
    }
  }

  @Override
  public RoutingInfo route(String routeParam)
  {
    if (_routingMap.isEmpty())
    {
      return null;
    }

    RoutingInfo result = lookup(_routingMap, _hashProvider.hash(routeParam));

    if (logger.isDebugEnabled())
    {
      logger.debug(routeParam + " is sent to " + result.toString());
    }

    return result;
  }

  private <K, V> V lookup(NavigableMap<K, V> ring, K key)
  {
    V result = ring.get(key);
    if (result == null)
    { // Not a direct match; take the next point clockwise, wrapping around to the first entry
      Map.Entry<K, V> entry = ring.ceilingEntry(key);
      result = (entry == null) ? ring.firstEntry().getValue() : entry.getValue();
    }

    return result;
  }

  @Override
  public String toString()
  {
    return _routingMap.toString();
  }
}
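
The RoutingInfo and HashProvider types used above are not shown in this commit view. Below is a minimal sketch of what they might look like, inferred only from how the balancer uses them; the field names and layout are assumptions, not the committed code.

package com.senseidb.cluster.routing;

import com.linkedin.norbert.javacompat.cluster.Node;
import java.util.Arrays;
import java.util.List;

// Hypothetical sketch: maps a string key to a 64-bit point on the ring.
interface HashProvider
{
  long hash(String key);
}

// Hypothetical sketch: one entry of the merged ring, holding the chosen node
// index for every partition at a given point. nodeLists and partitions are
// shared across all points; only nodeChoices differs per ring entry.
class RoutingInfo
{
  final List<Node>[] nodeLists;  // replica list per partition
  final int[] partitions;        // partition ids, parallel to nodeLists
  final int[] nodeChoices;       // index into nodeLists[i] chosen for partitions[i]

  RoutingInfo(List<Node>[] nodeLists, int[] partitions, int[] nodeChoices)
  {
    this.nodeLists = nodeLists;
    this.partitions = partitions;
    this.nodeChoices = nodeChoices;
  }

  @Override
  public String toString()
  {
    return "partitions " + Arrays.toString(partitions) + " -> node choices " + Arrays.toString(nodeChoices);
  }
}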
ConsistentHashLoadBalancerFactory.java
@@ -0,0 +1,24 @@
package com.senseidb.cluster.routing;


import com.linkedin.norbert.javacompat.cluster.Node;
import java.util.Set;


public class ConsistentHashLoadBalancerFactory implements SenseiLoadBalancerFactory {

  private final int _multiplyFactor;
  private final HashProvider _hashProvider;

  public ConsistentHashLoadBalancerFactory(HashProvider hashProvider, int multiplyFactor)
  {
    _hashProvider = hashProvider;
    _multiplyFactor = multiplyFactor;
  }

  @Override
  public SenseiLoadBalancer newLoadBalancer(Set<Node> nodes)
  {
    return new ConsistentHashLoadBalancer(_hashProvider, _multiplyFactor, nodes);
  }
}
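
For context, a small usage sketch (not part of the commit) showing how the factory and balancer above fit together. The hash provider and node set are assumed to be supplied by the surrounding cluster code, the multiply factor of 50 is an arbitrary example value, and the interface is assumed to declare route(String) as seen in the @Override above.

package com.senseidb.cluster.routing;

import com.linkedin.norbert.javacompat.cluster.Node;
import java.util.Set;

// Hypothetical usage sketch: build one balancer for the current node set and
// route a request key to a RoutingInfo (one node choice per partition).
public class RoutingUsageSketch
{
  public static void routeOnce(HashProvider hashProvider, Set<Node> nodes, String requestKey)
  {
    SenseiLoadBalancerFactory factory = new ConsistentHashLoadBalancerFactory(hashProvider, 50);
    SenseiLoadBalancer balancer = factory.newLoadBalancer(nodes);

    // One TreeMap lookup regardless of partition count; the result says which
    // node should serve each partition for this request key.
    System.out.println(requestKey + " -> " + balancer.route(requestKey));
  }
}

When the node set changes, the surrounding code is expected to call newLoadBalancer again, which is what the discussion below refers to as rebuilding the ring.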

2 comments on commit 2ca216e

@jhartman

Hi Terence,

I'm the maintainer of norbert, the library that sensei uses for distribution. I'd prefer not to move forward with this changeset, and to instead improve the way sensei uses norbert. Sensei doesn't take advantage of newer norbert features for request customization and routing. As a result, it bypasses a lot of norbert's infrastructure to protect itself and its degrader. This is really, really bad. If sensei just fixes the way it uses norbert, it will get this implementation for free. This has been a task on my plate for a long time, but I never got around to it when I was on cloud in SNA since it wasn't prioritized. The initial step was taken in January, when we migrated to the latest norbert release.

Norbert already has a class almost exactly like this. See https://github.com/linkedin-sna/norbert/blob/master/network/src/main/scala/com/linkedin/norbert/network/partitioned/loadbalancer/PartitionedConsistentHashedLoadBalancerFactory.scala. This class builds a consistent hash wheel per partition, unlike your approach. The storage space required, however, is the same: it's numPartitions * numBuckets in both cases.

I also believe I see a problem with your approach. You're mapping all the rings onto a single ring. Usually, you look up a position in the ring and "roll" until you find a spot. What happens when a machine goes down? Now a different machine that can't handle the partition will be the next one in the slot. So do you intend to iterate until you find the next one?

Let's work together to use norbert's infrastructure properly.


@chtyim commented on 2ca216e Mar 1, 2012


Hi Josh,

Sure. It's good to know that there is a plan to fix Sensei to use Norbert correctly.

For the approach I take, merging all partitions into one ring is only to reduce the number of lookups per routing (1 lookup vs. N lookups for N partitions). When there are changes to the node list (add/remove) or to partitions, a new ConsistentHashLoadBalancer instance is created, so no keep-iterating (rolling) situation will arise. The promise of the merge is that clients not routed to the down node won't be affected. For partitions that are affected, clients routed to the down node will be distributed evenly (sort of, by the hashing function) among the other replicas for that partition.

E.g.
Node 1 has partitions 1,2,3
Node 2 has partitions 2,3
Node 3 has partitions 1,2,3

So the ring might look like:

1 -> 1,1,2 (p1 handled by node1, p2 handled by node1, p3 handled by node2)
5 -> 3,2,1
20 -> 3,1,2
55 -> 1,3,3
….

Now, if node 2 dies, a new ring will be generated and it will look like this (notice that routing for partition 1 won't change; routing for partitions 2 and 3 also won't change for points that were not routed to node 2):

1 -> 1,1,1 (node 2 for p3 replaced with the next one down the ring, i.e. node 1)
5 -> 3,1,1
20 -> 3,1,3
55 -> 1,3,3

You can refer to the "testConsisitentHashRemove" test case for more details.

Terence
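
For readers following the thread, here is a tiny self-contained sketch (not from the commit) of the wrap-around lookup both comments refer to. It mirrors the lookup() helper in ConsistentHashLoadBalancer above: an exact hit wins, otherwise the next point clockwise (ceilingEntry) is taken, and a key past the last point wraps around to the first entry of the ring. The point values and node names are illustrative only.

import java.util.Map;
import java.util.NavigableMap;
import java.util.TreeMap;

public class RingLookupSketch
{
  // Same logic as ConsistentHashLoadBalancer.lookup(): exact match, else the
  // next point clockwise, else wrap around to the first point on the ring.
  static <K, V> V lookup(NavigableMap<K, V> ring, K key)
  {
    V result = ring.get(key);
    if (result == null)
    {
      Map.Entry<K, V> entry = ring.ceilingEntry(key);
      result = (entry == null) ? ring.firstEntry().getValue() : entry.getValue();
    }
    return result;
  }

  public static void main(String[] args)
  {
    // Points loosely modeled on the example above; values name the chosen node.
    NavigableMap<Long, String> ring = new TreeMap<Long, String>();
    ring.put(1L, "node1");
    ring.put(5L, "node3");
    ring.put(20L, "node3");
    ring.put(55L, "node1");

    System.out.println(lookup(ring, 5L));   // exact point -> node3
    System.out.println(lookup(ring, 7L));   // rolls forward to point 20 -> node3
    System.out.println(lookup(ring, 60L));  // past the last point, wraps to point 1 -> node1
  }
}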
