Return-Path: X-Original-To: archive-asf-public-internal@cust-asf2.ponee.io Delivered-To: archive-asf-public-internal@cust-asf2.ponee.io Received: from cust-asf.ponee.io (cust-asf.ponee.io [163.172.22.183]) by cust-asf2.ponee.io (Postfix) with ESMTP id C197B200CD0 for ; Tue, 25 Jul 2017 20:59:55 +0200 (CEST) Received: by cust-asf.ponee.io (Postfix) id 7D113167506; Tue, 25 Jul 2017 18:59:47 +0000 (UTC) Delivered-To: archive-asf-public@cust-asf.ponee.io Received: from mail.apache.org (hermes.apache.org [140.211.11.3]) by cust-asf.ponee.io (Postfix) with SMTP id 9C0A71674E7 for ; Tue, 25 Jul 2017 20:59:46 +0200 (CEST) Received: (qmail 47238 invoked by uid 500); 25 Jul 2017 18:59:45 -0000 Mailing-List: contact commits-help@kudu.apache.org; run by ezmlm Precedence: bulk List-Help: List-Unsubscribe: List-Post: List-Id: Reply-To: dev@kudu.apache.org Delivered-To: mailing list commits@kudu.apache.org Received: (qmail 47229 invoked by uid 99); 25 Jul 2017 18:59:45 -0000 Received: from git1-us-west.apache.org (HELO git1-us-west.apache.org) (140.211.11.23) by apache.org (qpsmtpd/0.29) with ESMTP; Tue, 25 Jul 2017 18:59:45 +0000 Received: by git1-us-west.apache.org (ASF Mail Server at git1-us-west.apache.org, from userid 33) id B881DE2F41; Tue, 25 Jul 2017 18:59:45 +0000 (UTC) Content-Type: text/plain; charset="us-ascii" MIME-Version: 1.0 Content-Transfer-Encoding: 7bit From: todd@apache.org To: commits@kudu.apache.org Message-Id: <262f2ef16c9d4843965317112ce64b08@git.apache.org> X-Mailer: ASF-Git Admin Mailer Subject: kudu git commit: KUDU-2053. Fix race in Java RequestTracker Date: Tue, 25 Jul 2017 18:59:45 +0000 (UTC) archived-at: Tue, 25 Jul 2017 18:59:55 -0000 Repository: kudu Updated Branches: refs/heads/branch-1.4.x 798f92c40 -> 5b0b786d2 KUDU-2053. Fix race in Java RequestTracker The implementation of RequestTracker.newSeqNo() was previously implemented as: 1. allocate the new sequence number 2. add that sequence number to the 'incomplete' map These steps were individually thread-safe by using an AtomicLong and a thread-safe collection, respectively, but they were not performed atomically. Thus we could have the following race: T1: allocate seq number 1 T2: allocate seq number 2 T2: add seq number 2 to incompleteRpcs T2: ask for firstIncomplete() -> 2 T2: send an RPC --> server GCs seqnum < 2 T1: add seq number 1 to incompleteRpcs T1: send an RPC with seq number 1 --> server responds with an error since this seqnum is already GCed This patch fixes the issue by moving back to a simpler synchronization scheme such that the two steps (allocation and addition to the tracking structure) are done under a single critical section. A new unit test is included which reliably reproduced the issue prior to the fix. Change-Id: I56f3d1ac85d34ca663e5b6378ff8362846a2424a Reviewed-on: http://gerrit.cloudera.org:8080/7494 Tested-by: Kudu Jenkins Reviewed-by: Jean-Daniel Cryans (cherry picked from commit be8e3c22b9a3a71b2c365e2b9ed306ea23d60058) Reviewed-on: http://gerrit.cloudera.org:8080/7496 Project: http://git-wip-us.apache.org/repos/asf/kudu/repo Commit: http://git-wip-us.apache.org/repos/asf/kudu/commit/5b0b786d Tree: http://git-wip-us.apache.org/repos/asf/kudu/tree/5b0b786d Diff: http://git-wip-us.apache.org/repos/asf/kudu/diff/5b0b786d Branch: refs/heads/branch-1.4.x Commit: 5b0b786d292a4f2fb000cbbc734e9f0c48ca6406 Parents: 798f92c Author: Todd Lipcon Authored: Mon Jul 24 23:07:40 2017 -0700 Committer: Todd Lipcon Committed: Tue Jul 25 18:59:04 2017 +0000 ---------------------------------------------------------------------- .../org/apache/kudu/client/RequestTracker.java | 33 +++++++++----- .../apache/kudu/client/TestRequestTracker.java | 48 ++++++++++++++++++++ 2 files changed, 70 insertions(+), 11 deletions(-) ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/kudu/blob/5b0b786d/java/kudu-client/src/main/java/org/apache/kudu/client/RequestTracker.java ---------------------------------------------------------------------- diff --git a/java/kudu-client/src/main/java/org/apache/kudu/client/RequestTracker.java b/java/kudu-client/src/main/java/org/apache/kudu/client/RequestTracker.java index 1945119..5f05a93 100644 --- a/java/kudu-client/src/main/java/org/apache/kudu/client/RequestTracker.java +++ b/java/kudu-client/src/main/java/org/apache/kudu/client/RequestTracker.java @@ -17,9 +17,8 @@ package org.apache.kudu.client; -import java.util.Queue; -import java.util.concurrent.PriorityBlockingQueue; -import java.util.concurrent.atomic.AtomicLong; +import java.util.TreeSet; +import javax.annotation.concurrent.GuardedBy; import org.apache.kudu.annotations.InterfaceAudience; @@ -28,8 +27,12 @@ import org.apache.kudu.annotations.InterfaceAudience; */ @InterfaceAudience.Private public class RequestTracker { - private final AtomicLong sequenceIdTracker = new AtomicLong(); - private final Queue incompleteRpcs = new PriorityBlockingQueue<>(); + private Object lock = new Object(); + + @GuardedBy("lock") + private long nextSeqNo = 1; + @GuardedBy("lock") + private final TreeSet incompleteRpcs = new TreeSet<>(); static final long NO_SEQ_NO = -1; @@ -48,9 +51,11 @@ public class RequestTracker { * @return a new sequence number */ public long newSeqNo() { - Long next = sequenceIdTracker.incrementAndGet(); - incompleteRpcs.add(next); - return next; + synchronized (lock) { + long seq = nextSeqNo++; + incompleteRpcs.add(seq); + return seq; + } } /** @@ -59,8 +64,12 @@ public class RequestTracker { * @return the first incomplete sequence number */ public long firstIncomplete() { - Long peek = incompleteRpcs.peek(); - return peek == null ? NO_SEQ_NO : peek; + synchronized (lock) { + if (incompleteRpcs.isEmpty()) { + return NO_SEQ_NO; + } + return incompleteRpcs.first(); + } } /** @@ -68,7 +77,9 @@ public class RequestTracker { * @param sequenceId the sequence id to mark as complete */ public void rpcCompleted(long sequenceId) { - incompleteRpcs.remove(sequenceId); + synchronized (lock) { + incompleteRpcs.remove(sequenceId); + } } public String getClientId() { http://git-wip-us.apache.org/repos/asf/kudu/blob/5b0b786d/java/kudu-client/src/test/java/org/apache/kudu/client/TestRequestTracker.java ---------------------------------------------------------------------- diff --git a/java/kudu-client/src/test/java/org/apache/kudu/client/TestRequestTracker.java b/java/kudu-client/src/test/java/org/apache/kudu/client/TestRequestTracker.java index 83e247d..c75c4fb 100644 --- a/java/kudu-client/src/test/java/org/apache/kudu/client/TestRequestTracker.java +++ b/java/kudu-client/src/test/java/org/apache/kudu/client/TestRequestTracker.java @@ -18,8 +18,19 @@ package org.apache.kudu.client; import static org.junit.Assert.assertEquals; +import java.util.List; +import java.util.concurrent.Callable; +import java.util.concurrent.ExecutionException; +import java.util.concurrent.ExecutorService; +import java.util.concurrent.Executors; +import java.util.concurrent.Future; +import java.util.concurrent.atomic.AtomicBoolean; + +import org.junit.Assert; import org.junit.Test; +import com.google.common.collect.Lists; + public class TestRequestTracker { @Test(timeout = 10000) @@ -71,4 +82,41 @@ public class TestRequestTracker { // Test that we get back to NO_SEQ_NO after marking them all. assertEquals(RequestTracker.NO_SEQ_NO, tracker.firstIncomplete()); } + + private static class Checker { + long curIncomplete = 0; + public synchronized void check(long seqNo, long firstIncomplete) { + Assert.assertTrue("should not send a seq number that was previously marked complete", + seqNo >= curIncomplete); + curIncomplete = Math.max(firstIncomplete, curIncomplete); + } + } + + @Test(timeout = 30000) + public void testMultiThreaded() throws InterruptedException, ExecutionException { + final AtomicBoolean done = new AtomicBoolean(false); + final RequestTracker rt = new RequestTracker("fake id"); + final Checker checker = new Checker(); + ExecutorService exec = Executors.newCachedThreadPool(); + List> futures = Lists.newArrayList(); + for (int i = 0; i < 16; i++) { + futures.add(exec.submit(new Callable() { + @Override + public Void call() { + while (!done.get()) { + long seqNo = rt.newSeqNo(); + long incomplete = rt.firstIncomplete(); + checker.check(seqNo, incomplete); + rt.rpcCompleted(seqNo); + } + return null; + } + })); + } + Thread.sleep(5000); + done.set(true); + for (Future f : futures) { + f.get(); + } + } }