
census: Fix retry stats data race #8422

Closed
27 changes: 23 additions & 4 deletions census/src/main/java/io/grpc/census/CensusStatsModule.java
@@ -356,12 +356,12 @@ public void streamClosed(Status status) {
if (module.recordFinishedRpcs) {
// Stream is closed early. So no need to record metrics for any inbound events after this
// point.
recordFinishedRpc();
recordFinishedAttempt();
}
} // Otherwise will report stats in callEnded() to guarantee all inbound metrics are recorded.
}

void recordFinishedRpc() {
void recordFinishedAttempt() {
MeasureMap measureMap = module.statsRecorder.newMeasureMap()
// TODO(songya): remove the deprecated measure constants once they are completely removed.
.put(DeprecatedCensusConstants.RPC_CLIENT_FINISHED_COUNT, 1)
@@ -439,7 +439,10 @@ static final class CallAttemptsTracerFactory extends
private final AtomicLong retryDelayNanos = new AtomicLong();
private final AtomicLong lastInactiveTimeStamp = new AtomicLong();
private final AtomicInteger activeStreams = new AtomicInteger();
private final AtomicInteger activeStreams2 = new AtomicInteger();
Member

I don't understand. Why do we need another atomic variable?

Member Author

Because the first atomic variable

if (activeStreams.decrementAndGet() == 0) {
    // Race condition between two extremely close events does not matter because the difference
    // in the result would be very small.
    long lastInactiveTimeStamp =
        this.lastInactiveTimeStamp.getAndSet(stopwatch.elapsed(TimeUnit.NANOSECONDS));
    retryDelayNanos.addAndGet(-lastInactiveTimeStamp);
}

is doing something after the atomic check, and that thing cannot be done atomically with the decrement. If another thread is using the same atomic variable, it will be broken.

Member

is doing something after the atomic check, and that thing cannot be done atomically with the decrement

Why does it need to be? There's no critical section, so it seems "any time after decrementAndGet() == 0 must be safe."

If another thread is using the same atomic variable, it will be broken.

What atomic variable? How would another thread be using it?

Member Author

It's not safe when callEnded() reports RETRY_DELAY_PER_CALL. To exaggerate the timing, add a long sleep as follows:

// attemptEnded()
if (activeStreams.decrementAndGet() == 0) {
    Thread.sleep(10_000_000_000L);   // long sleep
    long lastInactiveTimeStamp =
        this.lastInactiveTimeStamp.getAndSet(stopwatch.elapsed(TimeUnit.NANOSECONDS));
    retryDelayNanos.addAndGet(-lastInactiveTimeStamp);   // write operation
    if (callEnded == 1) {
      recordFinishedCall();
    }
}

...

// callEnded()
if (callEndedUpdater != null) {
  if (callEndedUpdater.getAndSet(this, 1) != 0) {
    return;
  }
} else {
  if (callEnded != 0) {
    return;
  }
  callEnded = 1;
}
if (activeStreams.get() == 0) {  // another thread using the same atomic variable
  recordFinishedCall();   // read operation not safe
}

Member

A race on retryDelayNanos wouldn't have been detected by a race detector. The race detector noticed a race on stopwatch. But why would there be a race on stopwatch, since stopwatch.elapsed() is read-only? (After all, we could have just saved a System.nanoTime() ourselves and that wouldn't change over time.)

It looks like the stopwatch.stop() in callEnded() shouldn't be there, as it adds no value and introduces a write that could interfere with attemptEnded(). I agree that you've found an additional race though.

Concerning updating retryDelayNanos in attemptEnded(), I think we should just "not do that." Instead of taking the full RPC duration and subtracting out the time in each attempt, can we instead just add the individual time periods when there has been no attempt? That is, we update the atomic when a delay period ends instead of when it starts? It looks like that'd be as simple as:

// CallAttemptsTracerFactory.<init>
retryDelayStopwatch = module.stopwatchSupplier.get(); // initially stopped

// newClientStreamTracer
if (activeStreams.incrementAndGet() == 1) {
  retryDelayStopwatch.stop(); // does nothing for the first attempt
  retryDelayNanos = stopwatch.elapsed(); // just a plain volatile
}

// attemptEnded
if (activeStreams.decrementAndGet() == 0) {
  retryDelayStopwatch.start();
}

That has the advantage that the stopwatch won't be racy and will be exactly 0 if there were no retries.

Member Author

A race on retryDelayNanos wouldn't have been detected by a race detector. The race detector noticed a race on stopwatch. But why would there be a race on stopwatch, since stopwatch.elapsed() is read-only? (After all, we could have just saved a System.nanoTime() ourselves and that wouldn't change over time.)

The read/write operations inside the if-block

if (activeStreams.decrementAndGet() == 0) { ...}

can happen concurrently with the write/read operations in callEnded(). So the race detector noticed stopwatch.elapsed() first.

It looks like the stopwatch.stop() in callEnded() shouldn't be there, as it adds no value.

I agree.

can we instead just add the individual time periods when there has been no attempt? That is, we update the atomic when a delay period ends instead of when it starts? It looks like that'd be as simple as:

// CallAttemptsTracerFactory.<init>
retryDelayStopwatch = module.stopwatchSupplier.get(); // initially stopped

// newClientStreamTracer
if (activeStreams.incrementAndGet() == 1) {
  retryDelayStopwatch.stop(); // does nothing for the first attempt
  retryDelayNanos = stopwatch.elapsed(); // just a plain volatile
}

// attemptEnded
if (activeStreams.decrementAndGet() == 0) {
  retryDelayStopwatch.start();
}

It works for retry but not for hedging.
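
For illustration, here is a toy sketch of the hedging case (hypothetical code, not grpc-java's; the class name HedgingStopwatchRace, the helper sleepMillis, the thread labels, and the sleeps are all made up): an attempt ending and a hedged attempt starting can pass the 1 -> 0 and 0 -> 1 counter transitions concurrently, so the unsynchronized Stopwatch calls race with each other.

import com.google.common.base.Stopwatch;
import java.util.concurrent.atomic.AtomicInteger;

// Toy demonstration of the hedging case; hypothetical code, not grpc-java's.
public final class HedgingStopwatchRace {
  public static void main(String[] args) throws Exception {
    AtomicInteger activeStreams = new AtomicInteger(1); // hedge #1 is running
    Stopwatch retryDelayStopwatch = Stopwatch.createUnstarted();

    Thread ending = new Thread(() -> {
      // attemptEnded() for hedge #1
      if (activeStreams.decrementAndGet() == 0) {
        sleepMillis(10); // the counter update and the stopwatch call are not atomic
        retryDelayStopwatch.start();
      }
    });
    Thread starting = new Thread(() -> {
      // newClientStreamTracer() for hedge #2, racing with the end of hedge #1
      if (activeStreams.incrementAndGet() == 1) {
        // May run before the start() above: Guava's stop() throws
        // IllegalStateException on a stopwatch that is not running, and the
        // two threads race on the stopwatch's unsynchronized state either way.
        retryDelayStopwatch.stop();
      }
    });
    ending.start();
    sleepMillis(5);
    starting.start();
    ending.join();
    starting.join();
  }

  private static void sleepMillis(long millis) {
    try {
      Thread.sleep(millis);
    } catch (InterruptedException e) {
      Thread.currentThread().interrupt();
    }
  }
}

Under sequential retries the two transitions do not overlap, which is presumably why the scheme is fine for retry but not for hedging.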

Member

The read/write operations inside the if-block

Yeah, I was basically getting to the point that "there has to be a bug." And that bug was that we were doing a write with stopwatch.stop().

It works for retry but not for hedging.

I just came here to mention that, as it just dawned on me. There are ways to fix that, but they wouldn't be trivial. I think the answer is "use a lock."

// newClientStreamTracer
synchronized (this) {
  if (activeStreams++ == 0) { // not volatile
    retryDelayStopwatch.stop(); // does nothing for the first attempt
    retryDelayNanos = stopwatch.elapsed();
  }
}

// attemptEnded
synchronized (this) {
  if (--activeStreams == 0) {
    retryDelayStopwatch.start();
  }
}

//------------ or -----------

// attemptEnded
synchronized (this) {
  if (activeStreams.decrementAndGet() == 0) {
    long lastInactiveTimeStamp =
            this.lastInactiveTimeStamp.getAndSet(stopwatch.elapsed(TimeUnit.NANOSECONDS));
    retryDelayNanos.addAndGet(-lastInactiveTimeStamp);
  }
}

I'd be willing to go further and move "anything that is used for control flow" under the lock. So attemptsPerCall and callEnded.
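
A rough sketch of that fully locked direction, assuming a simplified standalone class (the name RetryDelayTracker, the method attemptStarted(), and the empty recordFinishedCall() stub are illustrative, not the actual CensusStatsModule code):

import com.google.common.base.Stopwatch;
import java.util.concurrent.TimeUnit;

// Hypothetical, simplified sketch of "everything used for control flow under one lock".
final class RetryDelayTracker {
  private final Stopwatch stopwatch = Stopwatch.createStarted();
  private final Object lock = new Object();

  // All guarded by lock; plain fields, no atomics needed.
  private int activeStreams;
  private int attemptsPerCall;
  private boolean callEnded;
  private boolean finishedCallRecorded;
  private long retryDelayNanos;
  private long lastInactiveTimeStampNanos;

  void attemptStarted() {
    synchronized (lock) {
      attemptsPerCall++;
      if (activeStreams++ == 0 && attemptsPerCall > 1) {
        // A delay period just ended: add the time spent with no active attempt.
        retryDelayNanos += stopwatch.elapsed(TimeUnit.NANOSECONDS) - lastInactiveTimeStampNanos;
      }
    }
  }

  void attemptEnded() {
    boolean recordCall = false;
    synchronized (lock) {
      if (--activeStreams == 0) {
        // Remember when the call went inactive; used if another attempt starts later.
        lastInactiveTimeStampNanos = stopwatch.elapsed(TimeUnit.NANOSECONDS);
        if (callEnded && !finishedCallRecorded) {
          finishedCallRecorded = true;
          recordCall = true;
        }
      }
    }
    if (recordCall) {
      recordFinishedCall(); // record outside the lock
    }
  }

  void callEnded() {
    boolean recordCall = false;
    synchronized (lock) {
      if (callEnded) {
        return;
      }
      callEnded = true;
      if (activeStreams == 0 && !finishedCallRecorded) {
        finishedCallRecorded = true;
        recordCall = true;
      }
    }
    if (recordCall) {
      recordFinishedCall();
    }
  }

  private void recordFinishedCall() {
    // In the real module this is where RETRY_DELAY_PER_CALL etc. would be recorded.
  }
}

Keeping the stats recording itself outside the lock keeps the critical sections short, which matters if the module really is performance sensitive.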

Member Author

I think the answer is "use a lock."

That's fair. The original atomic counter activeStreams was already too complex. I wasn't using a lock in the original implementation just because I had a feeling that CensusStatsModule is performance sensitive (I saw it's using AtomicReferenceFieldUpdaters). Even if it's viable to fix this without a lock, I'd prefer using a lock.
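
For context, the field-updater pattern mentioned here avoids allocating a separate Atomic* object per call at the cost of some boilerplate; a minimal illustration, with a hypothetical class CallState and method markCallEnded() rather than the module's actual fields:

import java.util.concurrent.atomic.AtomicIntegerFieldUpdater;

// Illustrative only: shows the updater pattern, not CensusStatsModule's code.
final class CallState {
  private static final AtomicIntegerFieldUpdater<CallState> CALL_ENDED_UPDATER =
      AtomicIntegerFieldUpdater.newUpdater(CallState.class, "callEnded");

  private volatile int callEnded; // must be a volatile int for the updater

  boolean markCallEnded() {
    // Returns true only for the first caller; later callers observe 1 already set.
    return CALL_ENDED_UPDATER.getAndSet(this, 1) == 0;
  }
}

One shared static updater replaces one AtomicInteger allocation per call.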

Member Author

I'd be willing to go further and move "anything that is used for control flow" under the lock.

I was thinking about that too, for fixing the isReady()-halfClose() race. Using a lock seems like the only possible solution in that case.

Member

I was thinking about that too, for fixing the isReady()-halfClose() race. Using a lock seems like the only possible solution in that case.

The simplest possible solution is to make MessageFramer.closed volatile. Better though, I think, is to just stop using framer().isClosed() in the isReady() check. AbstractStream (or the subclasses) can just keep their own volatile variable that is set when halfClose()/close() is called. In fact, AbstractClientStream already has such a variable: AbstractClientStream.TransportState.outboundClosed.
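
A minimal sketch of that suggestion, assuming a simplified stream class (the names SketchStream and transportIsReady() are hypothetical, not the real AbstractClientStream API): isReady() reads a volatile flag set by halfClose() instead of the framer's unsynchronized state.

// Hypothetical simplification, not the actual AbstractClientStream code.
abstract class SketchStream {
  private volatile boolean outboundClosed;

  final void halfClose() {
    outboundClosed = true;
    // ... then flush/close the framer as before.
  }

  final boolean isReady() {
    // No read of framer().isClosed() here, so no race with the framer's
    // non-volatile internal state.
    return !outboundClosed && transportIsReady();
  }

  abstract boolean transportIsReady();
}

The volatile flag gives isReady() a well-defined view of the outbound half-close without taking a lock.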

private final AtomicBoolean activated = new AtomicBoolean();
private AtomicBoolean finishedRpcRecorded = new AtomicBoolean();
private Status status;

CallAttemptsTracerFactory(
CensusStatsModule module, TagContext parentCtx, String fullMethodName) {
@@ -462,6 +465,7 @@ static final class CallAttemptsTracerFactory extends
@Override
public ClientStreamTracer newClientStreamTracer(StreamInfo info, Metadata metadata) {
ClientTracer tracer = new ClientTracer(this, module, parentCtx, startCtx, info);
activeStreams2.incrementAndGet();
if (activeStreams.incrementAndGet() == 1) {
if (!activated.compareAndSet(false, true)) {
retryDelayNanos.addAndGet(stopwatch.elapsed(TimeUnit.NANOSECONDS));
@@ -489,9 +493,15 @@ void attemptEnded() {
this.lastInactiveTimeStamp.getAndSet(stopwatch.elapsed(TimeUnit.NANOSECONDS));
retryDelayNanos.addAndGet(-lastInactiveTimeStamp);
}
if (activeStreams2.decrementAndGet() == 0) {
if (callEnded == 1) {
recordFinishedCall();
}
}
}

void callEnded(Status status) {
this.status = status;
if (callEndedUpdater != null) {
if (callEndedUpdater.getAndSet(this, 1) != 0) {
return;
@@ -502,6 +512,15 @@ void callEnded(Status status) {
}
callEnded = 1;
}
if (activeStreams2.get() == 0) {
recordFinishedCall();
}
}

void recordFinishedCall() {
if (!finishedRpcRecorded.compareAndSet(false, true)) {
return;
}
if (!module.recordFinishedRpcs) {
return;
}
@@ -510,9 +529,9 @@ void callEnded(Status status) {
ClientTracer tracer = new ClientTracer(this, module, parentCtx, startCtx, null);
tracer.roundtripNanos = stopwatch.elapsed(TimeUnit.NANOSECONDS);
tracer.statusCode = status.getCode();
tracer.recordFinishedRpc();
tracer.recordFinishedAttempt();
} else if (inboundMetricTracer != null) {
inboundMetricTracer.recordFinishedRpc();
inboundMetricTracer.recordFinishedAttempt();
}

long retriesPerCall = 0;
@@ -356,6 +356,70 @@ public void statsRecorded() throws Exception {
assertRetryStatsRecorded(1, 0, 10_000);
}

@Test
public void statsRecorded_callCancelledBeforeCommit() throws Exception {
startNewServer();
retryPolicy = ImmutableMap.<String, Object>builder()
.put("maxAttempts", 4D)
.put("initialBackoff", "10s")
.put("maxBackoff", "10s")
.put("backoffMultiplier", 1D)
.put("retryableStatusCodes", Arrays.<Object>asList("UNAVAILABLE"))
.build();
createNewChannel();

// We will have streamClosed return at a particular moment that we want.
final CountDownLatch streamClosedLatch = new CountDownLatch(1);
ClientStreamTracer.Factory streamTracerFactory = new ClientStreamTracer.Factory() {
@Override
public ClientStreamTracer newClientStreamTracer(StreamInfo info, Metadata headers) {
return new ClientStreamTracer() {
@Override
public void streamClosed(Status status) {
if (status.getCode().equals(Code.CANCELLED)) {
try {
streamClosedLatch.await();
} catch (InterruptedException e) {
Thread.currentThread().interrupt();
throw new AssertionError("streamClosedLatch interrupted", e);
}
}
}
};
}
};
ClientCall<String, Integer> call = channel.newCall(
clientStreamingMethod, CallOptions.DEFAULT.withStreamTracerFactory(streamTracerFactory));
call.start(mockCallListener, new Metadata());
assertRpcStartedRecorded();
fakeClock.forwardTime(5, SECONDS);
String message = "String of length 20.";
call.sendMessage(message);
assertOutboundMessageRecorded();
ServerCall<String, Integer> serverCall = serverCalls.poll(5, SECONDS);
serverCall.request(2);
assertOutboundWireSizeRecorded(message.length());
// trigger retry
serverCall.close(
Status.UNAVAILABLE.withDescription("original attempt failed"),
new Metadata());
assertRpcStatusRecorded(Code.UNAVAILABLE, 5000, 1);
elapseBackoff(10, SECONDS);
assertRpcStartedRecorded();
assertOutboundMessageRecorded();
serverCall = serverCalls.poll(5, SECONDS);
serverCall.request(2);
assertOutboundWireSizeRecorded(message.length());
fakeClock.forwardTime(7, SECONDS);
call.cancel("Cancelled before commit", null); // A noop substream will commit.
// The call listener is closed, but the netty substream listener is not yet closed.
verify(mockCallListener, timeout(5000)).onClose(any(Status.class), any(Metadata.class));
// Let the netty substream listener be closed.
streamClosedLatch.countDown();
assertRetryStatsRecorded(1, 0, 10_000);
assertRpcStatusRecorded(Code.CANCELLED, 7_000, 1);
}

@Test
public void serverCancelledAndClientDeadlineExceeded() throws Exception {
startNewServer();