com.amazonaws.services.s3.model.S3ObjectInputStream Maven / Gradle / Ivy
/*
* Copyright 2012-2017 Amazon Technologies, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://aws.amazon.com/apache2.0
*
* This file is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES
* OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and
* limitations under the License.
*/
package com.amazonaws.services.s3.model;
import com.amazonaws.internal.MetricAware;
import com.amazonaws.internal.SdkFilterInputStream;
import com.amazonaws.metrics.AwsSdkMetrics;
import com.amazonaws.metrics.MetricFilterInputStream;
import com.amazonaws.services.s3.metrics.S3ServiceMetric;
import com.amazonaws.util.IOUtils;
import java.io.IOException;
import java.io.InputStream;
import org.apache.http.client.HttpClient;
import org.apache.http.client.methods.HttpRequestBase;
import org.apache.http.conn.EofSensorInputStream;
/**
* Input stream representing the content of an {@link S3Object}. In addition to
* the methods supplied by the {@link InputStream} class,
* {@link S3ObjectInputStream} supplies the abort() method, which will terminate
* an HTTP connection to the S3 object.
*/
public class S3ObjectInputStream extends SdkFilterInputStream {
private final HttpRequestBase httpRequest;
public S3ObjectInputStream(InputStream in, HttpRequestBase httpRequest) {
this(in, httpRequest, wrapWithByteCounting(in));
}
public S3ObjectInputStream(
InputStream in,
HttpRequestBase httpRequest,
boolean collectMetrics) {
super(collectMetrics
? new MetricFilterInputStream(S3ServiceMetric.S3DownloadThroughput, in)
: in);
this.httpRequest = httpRequest;
}
/**
* Returns true if we should wrap the given input stream with a byte
* counting wrapper; false otherwise.
*/
private static boolean wrapWithByteCounting(InputStream in) {
if (!AwsSdkMetrics.isMetricsEnabled()) {
return false; // metrics is disabled
}
if (in instanceof MetricAware) {
MetricAware aware = (MetricAware) in;
// wrap only if not already wrapped in one of it's inner chain of input stream
return !aware.isMetricActivated();
}
return true; // this is a raw input stream so metric wrapping is necessary
}
/**
* {@inheritDoc}
*
* Aborts the underlying http request without reading any more data and
* closes the stream.
*
* By default Apache {@link HttpClient} tries to reuse http connections by
* reading to the end of an attached input stream on
* {@link InputStream#close()}. This is efficient from a socket pool
* management perspective, but for objects with large payloads can incur
* significant overhead while bytes are read from s3 and discarded. It's up
* to clients to decide when to take the performance hit implicit in not
* reusing an http connection in order to not read unnecessary information
* from S3.
*
* @see EofSensorInputStream
*/
@Override
public void abort() {
if (httpRequest != null) {
httpRequest.abort();
}
IOUtils.closeQuietly(in, null);
}
/**
* Returns the http request from which this input stream is derived.
*/
public HttpRequestBase getHttpRequest() {
return httpRequest;
}
/**
* Returns the value of super.available() if the result is nonzero, or 1
* otherwise.
*
* This is necessary to work around a known bug in
* GZIPInputStream.available(), which returns zero in some edge cases,
* causing file truncation.
*
* Ref: http://bugs.java.com/bugdatabase/view_bug.do?bug_id=7036144
*/
@Override
public int available() throws IOException {
int estimate = super.available();
return estimate == 0 ? 1 : estimate;
}
/**
* {@inheritDoc}
*
* Delegates to {@link S3ObjectInputStream#abort()} if there is any data
* remaining in the stream. Otherwise, it safely closes the stream.
*
* @see S3ObjectInputStream#abort()
* @see com.amazonaws.services.s3.internal.S3AbortableInputStream
*/
@Override
public void close() throws IOException {
super.close();
}
}