com.google.cloud.storage.WriteFlushStrategy Maven / Gradle / Ivy
Show all versions of google-cloud-storage Show documentation
/*
* Copyright 2022 Google LLC
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.google.cloud.storage;
import com.google.api.core.SettableApiFuture;
import com.google.api.gax.grpc.GrpcCallContext;
import com.google.api.gax.retrying.ResultRetryAlgorithm;
import com.google.api.gax.rpc.ApiStreamObserver;
import com.google.api.gax.rpc.ClientStreamingCallable;
import com.google.cloud.storage.Conversions.Decoder;
import com.google.cloud.storage.Retrying.RetryingDependencies;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.storage.v2.WriteObjectRequest;
import com.google.storage.v2.WriteObjectResponse;
import java.util.List;
import java.util.concurrent.ExecutionException;
import java.util.function.Consumer;
import java.util.function.LongConsumer;
import java.util.function.Supplier;
import org.checkerframework.checker.nullness.qual.NonNull;
import org.checkerframework.checker.nullness.qual.Nullable;
/**
* When writing to GCS using the WriteObject rpc, there are some behavioral differences between
* performing a "direct" upload vs a "resumable" upload.
*
* This class provides the encapsulation of the stream and "fsync" lifecycles and possible
* automatic retry where applicable.
*
*
In this class "fsync" is used to mean "complete the client stream to GCS and await its
* response". We are loosely following the concept used in linux to flush data to disk fsync(2)
*/
final class WriteFlushStrategy {
private WriteFlushStrategy() {}
/**
* Create a {@link Flusher} which will "fsync" every time {@link Flusher#flush(List)} is called
* along with {@link Flusher#close(WriteObjectRequest)}.
*/
static FlusherFactory fsyncEveryFlush(
ClientStreamingCallable write,
RetryingDependencies deps,
ResultRetryAlgorithm> alg,
Supplier baseContextSupplier) {
return (String bucketName,
LongConsumer committedTotalBytesCallback,
Consumer onSuccessCallback) ->
new FsyncEveryFlusher(
write,
deps,
alg,
bucketName,
committedTotalBytesCallback,
onSuccessCallback,
baseContextSupplier);
}
/**
* Create a {@link Flusher} which will "fsync" only on {@link Flusher#close(WriteObjectRequest)}.
* Calls to {@link Flusher#flush(List)} will be sent but not synced.
*
* @see FlusherFactory#newFlusher(String, LongConsumer, Consumer)
*/
static FlusherFactory fsyncOnClose(
ClientStreamingCallable write) {
return (String bucketName,
LongConsumer committedTotalBytesCallback,
Consumer onSuccessCallback) ->
new FsyncOnClose(write, bucketName, committedTotalBytesCallback, onSuccessCallback);
}
static GrpcCallContext contextWithBucketName(String bucketName, GrpcCallContext baseContext) {
if (bucketName != null && !bucketName.isEmpty()) {
return baseContext.withExtraHeaders(
ImmutableMap.of(
"x-goog-request-params", ImmutableList.of(String.format("bucket=%s", bucketName))));
}
return baseContext;
}
/**
* Several fields of a WriteObjectRequest are only allowed on the "first" message sent to gcs,
* this utility method centralizes the logic necessary to clear those fields for use by subsequent
* messages.
*/
private static WriteObjectRequest possiblyPairDownRequest(
WriteObjectRequest message, boolean firstMessageOfStream) {
if (firstMessageOfStream && message.getWriteOffset() == 0) {
return message;
}
WriteObjectRequest.Builder b = message.toBuilder();
if (!firstMessageOfStream) {
b.clearUploadId();
}
if (message.getWriteOffset() > 0) {
b.clearWriteObjectSpec();
}
if (message.getWriteOffset() > 0 && !message.getFinishWrite()) {
b.clearObjectChecksums();
}
return b.build();
}
@FunctionalInterface
interface FlusherFactory {
/**
* @param committedTotalBytesCallback Callback to signal the total number of bytes committed by
* this flusher.
* @param onSuccessCallback Callback to signal success, and provide the final response.
*/
Flusher newFlusher(
String bucketName,
LongConsumer committedTotalBytesCallback,
Consumer onSuccessCallback);
}
interface Flusher {
void flush(@NonNull List segments);
void close(@Nullable WriteObjectRequest req);
}
private static final class FsyncEveryFlusher implements Flusher {
private final ClientStreamingCallable write;
private final RetryingDependencies deps;
private final ResultRetryAlgorithm> alg;
private final String bucketName;
private final LongConsumer sizeCallback;
private final Consumer completeCallback;
private final Supplier baseContextSupplier;
private FsyncEveryFlusher(
ClientStreamingCallable write,
RetryingDependencies deps,
ResultRetryAlgorithm> alg,
String bucketName,
LongConsumer sizeCallback,
Consumer completeCallback,
Supplier baseContextSupplier) {
this.write = write;
this.deps = deps;
this.alg = alg;
this.bucketName = bucketName;
this.sizeCallback = sizeCallback;
this.completeCallback = completeCallback;
this.baseContextSupplier = baseContextSupplier;
}
public void flush(@NonNull List segments) {
Retrying.run(
deps,
alg,
() -> {
Observer observer = new Observer(sizeCallback, completeCallback);
GrpcCallContext internalContext =
contextWithBucketName(bucketName, baseContextSupplier.get());
ApiStreamObserver write =
this.write.withDefaultCallContext(internalContext).clientStreamingCall(observer);
boolean first = true;
for (WriteObjectRequest message : segments) {
message = possiblyPairDownRequest(message, first);
write.onNext(message);
first = false;
}
write.onCompleted();
observer.await();
return null;
},
Decoder.identity());
}
public void close(@Nullable WriteObjectRequest req) {
if (req != null) {
flush(ImmutableList.of(req));
}
}
}
private static final class FsyncOnClose implements Flusher {
private final ClientStreamingCallable write;
private final String bucketName;
private final Observer responseObserver;
private volatile ApiStreamObserver stream;
private boolean first = true;
private FsyncOnClose(
ClientStreamingCallable write,
String bucketName,
LongConsumer sizeCallback,
Consumer completeCallback) {
this.write = write;
this.bucketName = bucketName;
this.responseObserver = new Observer(sizeCallback, completeCallback);
}
@Override
public void flush(@NonNull List segments) {
ensureOpen();
for (WriteObjectRequest message : segments) {
message = possiblyPairDownRequest(message, first);
stream.onNext(message);
first = false;
}
}
@Override
public void close(@Nullable WriteObjectRequest message) {
ensureOpen();
if (message != null) {
message = possiblyPairDownRequest(message, first);
stream.onNext(message);
}
stream.onCompleted();
responseObserver.await();
}
private void ensureOpen() {
if (stream == null) {
synchronized (this) {
if (stream == null) {
GrpcCallContext internalContext =
contextWithBucketName(bucketName, GrpcCallContext.createDefault());
stream =
this.write
.withDefaultCallContext(internalContext)
.clientStreamingCall(responseObserver);
}
}
}
}
}
static class Observer implements ApiStreamObserver {
private final LongConsumer sizeCallback;
private final Consumer completeCallback;
private final SettableApiFuture invocationHandle;
private volatile WriteObjectResponse last;
Observer(LongConsumer sizeCallback, Consumer completeCallback) {
this.sizeCallback = sizeCallback;
this.completeCallback = completeCallback;
this.invocationHandle = SettableApiFuture.create();
}
@Override
public void onNext(WriteObjectResponse value) {
// incremental update
if (value.hasPersistedSize()) {
sizeCallback.accept(value.getPersistedSize());
} else if (value.hasResource()) {
sizeCallback.accept(value.getResource().getSize());
}
last = value;
}
/**
* observed exceptions so far
*
*
* - {@link com.google.api.gax.rpc.OutOfRangeException}
*
- {@link com.google.api.gax.rpc.AlreadyExistsException}
*
- {@link io.grpc.StatusRuntimeException}
*
*/
@Override
public void onError(Throwable t) {
invocationHandle.setException(t);
}
@Override
public void onCompleted() {
if (last != null && last.hasResource()) {
completeCallback.accept(last);
}
invocationHandle.set(null);
}
void await() {
try {
invocationHandle.get();
} catch (InterruptedException | ExecutionException e) {
if (e.getCause() instanceof RuntimeException) {
throw (RuntimeException) e.getCause();
} else {
throw new RuntimeException(e);
}
}
}
}
}