Skip to content
This repository has been archived by the owner on Sep 26, 2023. It is now read-only.

Commit

Permalink
Introduced BatchStats for failures that occurred during batching
Browse files Browse the repository at this point in the history
BatchStats now keeps a counter for each type of exception that happened at the RPC level as well as at the ElementT/entry object level.

Also refactored the exception message to be more detailed.
  • Loading branch information
rahulKQL committed Oct 21, 2019
1 parent 65a9af8 commit 30f23f5
Show file tree
Hide file tree
Showing 6 changed files with 405 additions and 181 deletions.
190 changes: 190 additions & 0 deletions gax/src/main/java/com/google/api/gax/batching/BatchStats.java
@@ -0,0 +1,190 @@
/*
* Copyright 2019 Google LLC
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are
* met:
*
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above
* copyright notice, this list of conditions and the following disclaimer
* in the documentation and/or other materials provided with the
* distribution.
* * Neither the name of Google LLC nor the names of its
* contributors may be used to endorse or promote products derived from
* this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
package com.google.api.gax.batching;

import com.google.api.core.ApiFutureCallback;
import com.google.api.gax.rpc.ApiException;
import com.google.api.gax.rpc.StatusCode;
import java.util.Map;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.atomic.AtomicInteger;
import javax.annotation.Nullable;

/**
 * Keeps statistics about failed operations (both at the RPC and at the ElementT/entry level) in a
 * {@link Batcher}. For each level it tracks how many failures were seen per exception class and,
 * for {@link ApiException}s, how many were seen per {@link StatusCode.Code}.
 *
 * <p>Failures are fed in through the callbacks returned by {@link #getRequestCallback()} and
 * {@link #getEntryCallback()}; {@link #asException()} turns the collected counters into a single
 * {@link BatchingException}.
 *
 * <p>Counter updates are performed while holding {@code statusLock} (status code maps) or {@code
 * errorLock} (exception class maps). {@link #asException()} reads the maps without taking those
 * locks.
 */
class BatchStats {

  /** Number of failed RPCs, keyed by exception class. */
  private final Map<Class<?>, AtomicInteger> requestExceptionCounts = new ConcurrentHashMap<>();
  /** Number of RPCs that failed with an {@link ApiException}, keyed by status code. */
  private final Map<StatusCode.Code, AtomicInteger> requestStatusCounts = new ConcurrentHashMap<>();
  /**
   * Incremented only the first time a given exception class is recorded for an entry.
   *
   * <p>NOTE(review): {@link #asException()} reports this value as the number of partial failures;
   * confirm that counting once per first-seen exception class is the intended meaning.
   */
  private final AtomicInteger partialBatchFailures = new AtomicInteger(0);
  /** Number of failed entries, keyed by exception class. */
  private final Map<Class<?>, AtomicInteger> entryExceptionCounts = new ConcurrentHashMap<>();
  /** Number of entries that failed with an {@link ApiException}, keyed by status code. */
  private final Map<StatusCode.Code, AtomicInteger> entryStatusCounts = new ConcurrentHashMap<>();

  private final Object errorLock = new Object();
  private final Object statusLock = new Object();

  /**
   * Returns a callback that records every failure it receives as a request (RPC) level failure.
   * Successful results are ignored.
   */
  <T> ApiFutureCallback<T> getRequestCallback() {
    return new ApiFutureCallback<T>() {
      @Override
      public void onFailure(Throwable t) {
        recordRequestException(t);
      }

      @Override
      public void onSuccess(T result) {}
    };
  }

  /**
   * Returns a callback that records every failure it receives as an entry level failure.
   * Successful results are ignored.
   */
  <T> ApiFutureCallback<T> getEntryCallback() {
    return new ApiFutureCallback<T>() {
      @Override
      public void onFailure(Throwable t) {
        recordEntryException(t);
      }

      @Override
      public void onSuccess(T result) {}
    };
  }

  /**
   * Counts a failed RPC by exception class and, for an {@link ApiException}, by status code.
   *
   * @param throwable the failure reported for the RPC
   */
  private void recordRequestException(Throwable throwable) {
    Class<?> exceptionClass = throwable.getClass();

    if (throwable instanceof ApiException) {
      StatusCode.Code code = ((ApiException) throwable).getStatusCode().getCode();
      // All ApiException subclasses are tallied together under ApiException itself.
      exceptionClass = ApiException.class;

      synchronized (statusLock) {
        increment(requestStatusCounts, code);
      }
    }

    synchronized (errorLock) {
      increment(requestExceptionCounts, exceptionClass);
    }
  }

  /**
   * Counts a failed entry by exception class and, for an {@link ApiException}, by status code.
   *
   * @param throwable the failure reported for the entry
   */
  private void recordEntryException(Throwable throwable) {
    Class<?> exceptionClass = throwable.getClass();

    if (throwable instanceof ApiException) {
      StatusCode.Code code = ((ApiException) throwable).getStatusCode().getCode();
      // All ApiException subclasses are tallied together under ApiException itself.
      exceptionClass = ApiException.class;

      synchronized (statusLock) {
        increment(entryStatusCounts, code);
      }
    }

    synchronized (errorLock) {
      boolean firstOfItsClass = increment(entryExceptionCounts, exceptionClass);
      if (firstOfItsClass) {
        partialBatchFailures.incrementAndGet();
      }
    }
  }

  /**
   * Adds one to the counter stored under {@code key}, creating the counter when it is missing.
   * Callers are expected to hold the lock that guards {@code counts}.
   *
   * @return {@code true} if no counter existed for {@code key} before this call
   */
  private static <K> boolean increment(Map<K, AtomicInteger> counts, K key) {
    AtomicInteger counter = counts.get(key);
    if (counter == null) {
      counts.put(key, new AtomicInteger(1));
      return true;
    }
    counter.incrementAndGet();
    return false;
  }

  /** Returns the sum of all counters in {@code counts}. */
  private static int sumOf(Map<?, AtomicInteger> counts) {
    int total = 0;
    for (AtomicInteger counter : counts.values()) {
      total += counter.get();
    }
    return total;
  }

  /**
   * Appends one {@code "<count> <ExceptionSimpleName> "} item per exception class; the {@link
   * ApiException} item is followed by a parenthesised list of {@code "<count> <status code> "}
   * items.
   */
  private static void appendFailureBreakdown(
      StringBuilder sb,
      Map<Class<?>, AtomicInteger> exceptionCounts,
      Map<StatusCode.Code, AtomicInteger> statusCounts) {
    for (Map.Entry<Class<?>, AtomicInteger> failure : exceptionCounts.entrySet()) {
      Class<?> exceptionClass = failure.getKey();
      sb.append(String.format("%d %s ", failure.getValue().get(), exceptionClass.getSimpleName()));
      if (exceptionClass.equals(ApiException.class)) {
        sb.append("(");
        for (Map.Entry<StatusCode.Code, AtomicInteger> status : statusCounts.entrySet()) {
          sb.append(String.format("%d %s ", status.getValue().get(), status.getKey()));
        }
        sb.append(") ");
      }
    }
  }

  /**
   * Calculates and formats the message with request and entry failure count.
   *
   * @return a {@link BatchingException} describing the recorded failures, or {@code null} when no
   *     request failure and no entry failure has been recorded
   */
  @Nullable
  BatchingException asException() {
    // Read once so that the null check and both mentions in the message agree with each other.
    int partialFailures = partialBatchFailures.get();
    if (requestExceptionCounts.isEmpty() && partialFailures == 0) {
      return null;
    }

    StringBuilder sb = new StringBuilder();

    if (requestExceptionCounts.isEmpty()) {
      sb.append("Batching finished with ");
    } else {
      // The number of failed batches is the total of the per-class counters, not the number of
      // distinct exception classes.
      sb.append(
          String.format("%d batches failed to apply due to: ", sumOf(requestExceptionCounts)));
      appendFailureBreakdown(sb, requestExceptionCounts, requestStatusCounts);
    }

    if (partialFailures > 0) {
      sb.append(String.format("%d partial failures.", partialFailures));
      sb.append(
          String.format(
              " The %d partial failures contained %d entries that failed with: ",
              partialFailures, sumOf(entryExceptionCounts)));
      appendFailureBreakdown(sb, entryExceptionCounts, entryStatusCounts);
    }
    sb.append(".");
    return new BatchingException(sb.toString());
  }
}
53 changes: 9 additions & 44 deletions gax/src/main/java/com/google/api/gax/batching/BatcherImpl.java
Expand Up @@ -37,8 +37,6 @@
import com.google.api.core.BetaApi;
import com.google.api.core.InternalApi;
import com.google.api.core.SettableApiFuture;
import com.google.api.gax.rpc.ApiException;
import com.google.api.gax.rpc.StatusCode;
import com.google.api.gax.rpc.UnaryCallable;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.base.Preconditions;
Expand All @@ -49,17 +47,14 @@
import java.lang.ref.WeakReference;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentMap;
import java.util.concurrent.Future;
import java.util.concurrent.ScheduledExecutorService;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.atomic.AtomicLong;
import java.util.logging.Level;
import java.util.logging.Logger;

/**
* Queues up the elements until {@link #flush()} is called; once batching is over, returned future
* resolves.
Expand Down Expand Up @@ -88,13 +83,9 @@ public class BatcherImpl<ElementT, ElementResultT, RequestT, ResponseT>
private final AtomicInteger numOfOutstandingBatches = new AtomicInteger(0);
private final Object flushLock = new Object();
private final Object elementLock = new Object();
private final Object errorLock = new Object();
private final Future<?> scheduledFuture;
private volatile boolean isClosed = false;

private AtomicLong numOfFailure = new AtomicLong();
private final Map<Class, AtomicInteger> failuresTypeCount = new ConcurrentHashMap<>();
private final Map<StatusCode, AtomicInteger> failureStatusCodeCount = new ConcurrentHashMap<>();
private final BatchStats batchStats = new BatchStats();

/**
* @param batchingDescriptor a {@link BatchingDescriptor} for transforming individual elements
Expand Down Expand Up @@ -137,6 +128,7 @@ public ApiFuture<ElementResultT> add(ElementT element) {
Preconditions.checkState(!isClosed, "Cannot add elements on a closed batcher");
SettableApiFuture<ElementResultT> result = SettableApiFuture.create();

ApiFutures.addCallback(result, batchStats.<ElementResultT>getEntryCallback(), directExecutor());
synchronized (elementLock) {
currentOpenBatch.add(element, result);
}
Expand Down Expand Up @@ -171,6 +163,9 @@ public void sendOutstanding() {
unaryCallable.futureCall(accumulatedBatch.builder.build());

numOfOutstandingBatches.incrementAndGet();

ApiFutures.addCallback(
batchResponse, batchStats.<ResponseT>getRequestCallback(), directExecutor());
ApiFutures.addCallback(
batchResponse,
new ApiFutureCallback<ResponseT>() {
Expand All @@ -186,7 +181,6 @@ public void onSuccess(ResponseT response) {
@Override
public void onFailure(Throwable throwable) {
try {
addException(throwable);
accumulatedBatch.onBatchFailure(throwable);
} finally {
onBatchCompletion();
Expand All @@ -212,36 +206,6 @@ private void awaitAllOutstandingBatches() throws InterruptedException {
}
}

/**
 * Records one failed RPC: bumps the overall failure counter, the counter kept for the exception
 * type and, when the failure is an {@link ApiException}, the counter kept for its {@link
 * StatusCode}.
 */
private void addException(Throwable throwable) {
  numOfFailure.incrementAndGet();

  final boolean apiFailure = throwable instanceof ApiException;
  if (apiFailure) {
    StatusCode statusCode = ((ApiException) throwable).getStatusCode();

    synchronized (errorLock) {
      AtomicInteger statusCounter = failureStatusCodeCount.get(statusCode);
      if (statusCounter == null) {
        failureStatusCodeCount.put(statusCode, new AtomicInteger(1));
      } else {
        statusCounter.incrementAndGet();
      }
    }
  }

  // Every ApiException subclass is tallied under ApiException itself.
  Class failureType = apiFailure ? ApiException.class : throwable.getClass();

  synchronized (errorLock) {
    AtomicInteger typeCounter = failuresTypeCount.get(failureType);
    if (typeCounter == null) {
      failuresTypeCount.put(failureType, new AtomicInteger(1));
    } else {
      typeCounter.incrementAndGet();
    }
  }
}

/** {@inheritDoc} */
@Override
public void close() throws InterruptedException {
Expand All @@ -251,11 +215,12 @@ public void close() throws InterruptedException {
flush();
scheduledFuture.cancel(true);
isClosed = true;
if (numOfFailure.get() > 0) {
throw new BatchingException(numOfFailure.get(), failuresTypeCount, failureStatusCodeCount);
}
currentBatcherReference.closed = true;
currentBatcherReference.clear();
BatchingException exception = batchStats.asException();
if (exception != null) {
throw exception;
}
}

/**
Expand Down
Expand Up @@ -29,41 +29,15 @@
*/
package com.google.api.gax.batching;

import com.google.api.gax.rpc.StatusCode;
import java.util.Map;
import java.util.concurrent.atomic.AtomicInteger;
import com.google.api.core.BetaApi;
import com.google.api.core.InternalExtensionOnly;

/**
* This class represents the number of failed exceptions while performing Batching. It also provides
* the count of exceptions types and count of each failed statusCodes occurred in the Batching
* process.
*/
/** Represents an exception that occurred during batching. */
@BetaApi("The surface for batching is not stable yet and may change in the future.")
@InternalExtensionOnly("For google-cloud-java client use only.")
public class BatchingException extends RuntimeException {

private final long numOfFailure;
private final Map<Class, AtomicInteger> exceptionCount;
private final Map<StatusCode, AtomicInteger> statusCodeCount;

BatchingException(
long numOfFailure,
Map<Class, AtomicInteger> exceptionCount,
Map<StatusCode, AtomicInteger> statusCodeCount) {
super("Failed to commit " + numOfFailure + " mutations");

this.numOfFailure = numOfFailure;
this.exceptionCount = exceptionCount;
this.statusCodeCount = statusCodeCount;
}

public long getTotalFailureCount() {
return numOfFailure;
}

public Map<Class, AtomicInteger> getFailureTypesCount() {
return exceptionCount;
}

public Map<StatusCode, AtomicInteger> getFailureStatusCodeCount() {
return statusCodeCount;
BatchingException(String message) {
super(message);
}
}

0 comments on commit 30f23f5

Please sign in to comment.