Repository: kafka
Updated Branches:
  refs/heads/trunk 7c82afddc -> 10311c138


KAFKA-1984; Java producer may miss an available partition; patched by Jun Rao; 
reviewed by Ewen Cheslack-Postava, Jay Kreps, and Guozhang Wang


Project: http://git-wip-us.apache.org/repos/asf/kafka/repo
Commit: http://git-wip-us.apache.org/repos/asf/kafka/commit/10311c13
Tree: http://git-wip-us.apache.org/repos/asf/kafka/tree/10311c13
Diff: http://git-wip-us.apache.org/repos/asf/kafka/diff/10311c13

Branch: refs/heads/trunk
Commit: 10311c138923dcded5d8f57f587c7f7ef1119dac
Parents: 7c82afd
Author: Jun Rao <jun...@gmail.com>
Authored: Tue Feb 24 14:07:27 2015 -0800
Committer: Jun Rao <jun...@gmail.com>
Committed: Tue Feb 24 14:07:27 2015 -0800

----------------------------------------------------------------------
 .../clients/producer/internals/Partitioner.java | 15 +++++-----
 .../java/org/apache/kafka/common/Cluster.java   | 24 ++++++++++++++--
 .../kafka/clients/producer/PartitionerTest.java | 29 ++++++++++----------
 3 files changed, 45 insertions(+), 23 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/kafka/blob/10311c13/clients/src/main/java/org/apache/kafka/clients/producer/internals/Partitioner.java
----------------------------------------------------------------------
diff --git 
a/clients/src/main/java/org/apache/kafka/clients/producer/internals/Partitioner.java
 
b/clients/src/main/java/org/apache/kafka/clients/producer/internals/Partitioner.java
index 8112e6d..dfb936d 100644
--- 
a/clients/src/main/java/org/apache/kafka/clients/producer/internals/Partitioner.java
+++ 
b/clients/src/main/java/org/apache/kafka/clients/producer/internals/Partitioner.java
@@ -56,14 +56,15 @@ public class Partitioner {
                                                    + "].");
             return partition;
         } else if (key == null) {
-            // choose the next available node in a round-robin fashion
-            for (int i = 0; i < numPartitions; i++) {
-                int part = Utils.abs(counter.getAndIncrement()) % 
numPartitions;
-                if (partitions.get(part).leader() != null)
-                    return part;
+            int nextValue = counter.getAndIncrement();
+            List<PartitionInfo> availablePartitions = 
cluster.availablePartitionsForTopic(topic);
+            if (availablePartitions.size() > 0) {
+                int part = Utils.abs(nextValue) % availablePartitions.size();
+                return availablePartitions.get(part).partition();
+            } else {
+                // no partition is available, so fall back to picking from all partitions
+                return Utils.abs(nextValue) % numPartitions;
             }
-            // no partitions are available, give a non-available partition
-            return Utils.abs(counter.getAndIncrement()) % numPartitions;
         } else {
             // hash the key to choose a partition
             return Utils.abs(Utils.murmur2(key)) % numPartitions;

http://git-wip-us.apache.org/repos/asf/kafka/blob/10311c13/clients/src/main/java/org/apache/kafka/common/Cluster.java
----------------------------------------------------------------------
diff --git a/clients/src/main/java/org/apache/kafka/common/Cluster.java 
b/clients/src/main/java/org/apache/kafka/common/Cluster.java
index 8fcd291..60594a7 100644
--- a/clients/src/main/java/org/apache/kafka/common/Cluster.java
+++ b/clients/src/main/java/org/apache/kafka/common/Cluster.java
@@ -25,6 +25,7 @@ public final class Cluster {
     private final List<Node> nodes;
     private final Map<TopicPartition, PartitionInfo> 
partitionsByTopicPartition;
     private final Map<String, List<PartitionInfo>> partitionsByTopic;
+    private final Map<String, List<PartitionInfo>> availablePartitionsByTopic;
     private final Map<Integer, List<PartitionInfo>> partitionsByNode;
     private final Map<Integer, Node> nodesById;
 
@@ -68,8 +69,18 @@ public final class Cluster {
             }
         }
         this.partitionsByTopic = new HashMap<String, 
List<PartitionInfo>>(partsForTopic.size());
-        for (Map.Entry<String, List<PartitionInfo>> entry : 
partsForTopic.entrySet())
-            this.partitionsByTopic.put(entry.getKey(), 
Collections.unmodifiableList(entry.getValue()));
+        this.availablePartitionsByTopic = new HashMap<String, 
List<PartitionInfo>>(partsForTopic.size());
+        for (Map.Entry<String, List<PartitionInfo>> entry : 
partsForTopic.entrySet()) {
+            String topic = entry.getKey();
+            List<PartitionInfo> partitionList = entry.getValue();
+            this.partitionsByTopic.put(topic, 
Collections.unmodifiableList(partitionList));
+            List<PartitionInfo> availablePartitions = new 
ArrayList<PartitionInfo>();
+            for (PartitionInfo part : partitionList) {
+                if (part.leader() != null)
+                    availablePartitions.add(part);
+            }
+            this.availablePartitionsByTopic.put(topic, 
Collections.unmodifiableList(availablePartitions));
+        }
         this.partitionsByNode = new HashMap<Integer, 
List<PartitionInfo>>(partsForNode.size());
         for (Map.Entry<Integer, List<PartitionInfo>> entry : 
partsForNode.entrySet())
             this.partitionsByNode.put(entry.getKey(), 
Collections.unmodifiableList(entry.getValue()));
@@ -144,6 +155,15 @@ public final class Cluster {
     }
 
     /**
+     * Get the list of available partitions (those with a non-null leader) for this topic
+     * @param topic The topic name
+     * @return A list of partitions that have a leader, or null if there is no entry for the topic
+     */
+    public List<PartitionInfo> availablePartitionsForTopic(String topic) {
+        return this.availablePartitionsByTopic.get(topic);
+    }
+
+    /**
      * Get the list of partitions whose leader is this node
      * @param nodeId The node id
      * @return A list of partitions

http://git-wip-us.apache.org/repos/asf/kafka/blob/10311c13/clients/src/test/java/org/apache/kafka/clients/producer/PartitionerTest.java
----------------------------------------------------------------------
diff --git 
a/clients/src/test/java/org/apache/kafka/clients/producer/PartitionerTest.java 
b/clients/src/test/java/org/apache/kafka/clients/producer/PartitionerTest.java
index 29c8417..404bedb 100644
--- 
a/clients/src/test/java/org/apache/kafka/clients/producer/PartitionerTest.java
+++ 
b/clients/src/test/java/org/apache/kafka/clients/producer/PartitionerTest.java
@@ -33,9 +33,10 @@ public class PartitionerTest {
     private Node node2 = new Node(2, "localhost", 101);
     private Node[] nodes = new Node[] {node0, node1, node2};
     private String topic = "test";
-    private List<PartitionInfo> partitions = asList(new PartitionInfo(topic, 
0, node0, nodes, nodes),
-                                                    new PartitionInfo(topic, 
1, node1, nodes, nodes),
-                                                    new PartitionInfo(topic, 
2, null, nodes, nodes));
+    // Intentionally make the partition list not in partition order to test 
the edge cases.
+    private List<PartitionInfo> partitions = asList(new PartitionInfo(topic, 
1, null, nodes, nodes),
+                                                    new PartitionInfo(topic, 
2, node1, nodes, nodes),
+                                                    new PartitionInfo(topic, 
0, node0, nodes, nodes));
     private Cluster cluster = new Cluster(asList(node0, node1, node2), 
partitions);
 
     @Test
@@ -50,19 +51,19 @@ public class PartitionerTest {
     }
 
     @Test
-    public void testRoundRobinIsStable() {
-        int startPart = partitioner.partition("test", null, null, cluster);
+    public void testRoundRobinWithUnavailablePartitions() {
+        // When there are some unavailable partitions, we want to make sure 
that (1) we always pick an available partition,
+        // and (2) the available partitions are selected in a round robin way.
+        int countForPart0 = 0;
+        int countForPart2 = 0;
         for (int i = 1; i <= 100; i++) {
-            int partition = partitioner.partition("test", null, null, cluster);
-            assertEquals("Should yield a different partition each call with 
round-robin partitioner", partition, (startPart + i) % 2);
-        }
-    }
-
-    @Test
-    public void testRoundRobinWithDownNode() {
-        for (int i = 0; i < partitions.size(); i++) {
             int part = partitioner.partition("test", null, null, cluster);
-            assertTrue("We should never choose a leader-less node in round 
robin", part >= 0 && part < 2);
+            assertTrue("We should never choose a leader-less node in round 
robin", part == 0 || part == 2);
+            if (part == 0)
+                countForPart0++;
+            else
+                countForPart2++;
         }
+        assertEquals("The distribution between two available partitions should 
be even", countForPart0, countForPart2);
     }
 }

Reply via email to