org.apache.iceberg.aws.s3.S3FileIO Maven / Gradle / Ivy
Show all versions of iceberg-aws Show documentation
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.iceberg.aws.s3;
import java.util.Map;
import java.util.concurrent.atomic.AtomicBoolean;
import org.apache.iceberg.aws.AwsClientFactories;
import org.apache.iceberg.aws.AwsClientFactory;
import org.apache.iceberg.aws.AwsProperties;
import org.apache.iceberg.io.FileIO;
import org.apache.iceberg.io.InputFile;
import org.apache.iceberg.io.OutputFile;
import org.apache.iceberg.util.SerializableSupplier;
import software.amazon.awssdk.services.s3.S3Client;
import software.amazon.awssdk.services.s3.model.DeleteObjectRequest;
/**
* FileIO implementation backed by S3.
*
* Locations used must follow the conventions for S3 URIs (e.g. s3://bucket/path...).
* URIs with schemes s3a, s3n, https are also treated as s3 file paths.
* Using this FileIO with other schemes will result in {@link org.apache.iceberg.exceptions.ValidationException}.
*/
public class S3FileIO implements FileIO {
private SerializableSupplier s3;
private AwsProperties awsProperties;
private AwsClientFactory awsClientFactory;
private transient S3Client client;
private final AtomicBoolean isResourceClosed = new AtomicBoolean(false);
/**
* No-arg constructor to load the FileIO dynamically.
*
* All fields are initialized by calling {@link S3FileIO#initialize(Map)} later.
*/
public S3FileIO() {
}
/**
* Constructor with custom s3 supplier and default AWS properties.
*
* Calling {@link S3FileIO#initialize(Map)} will overwrite information set in this constructor.
* @param s3 s3 supplier
*/
public S3FileIO(SerializableSupplier s3) {
this(s3, new AwsProperties());
}
/**
* Constructor with custom s3 supplier and AWS properties.
*
* Calling {@link S3FileIO#initialize(Map)} will overwrite information set in this constructor.
* @param s3 s3 supplier
* @param awsProperties aws properties
*/
public S3FileIO(SerializableSupplier s3, AwsProperties awsProperties) {
this.s3 = s3;
this.awsProperties = awsProperties;
}
@Override
public InputFile newInputFile(String path) {
return S3InputFile.fromLocation(path, client(), awsProperties);
}
@Override
public OutputFile newOutputFile(String path) {
return S3OutputFile.fromLocation(path, client(), awsProperties);
}
@Override
public void deleteFile(String path) {
S3URI location = new S3URI(path);
DeleteObjectRequest deleteRequest =
DeleteObjectRequest.builder().bucket(location.bucket()).key(location.key()).build();
client().deleteObject(deleteRequest);
}
private S3Client client() {
if (client == null) {
client = s3.get();
}
return client;
}
@Override
public void initialize(Map properties) {
this.awsProperties = new AwsProperties(properties);
this.awsClientFactory = AwsClientFactories.from(properties);
this.s3 = awsClientFactory::s3;
}
@Override
public void close() {
// handles concurrent calls to close()
if (isResourceClosed.compareAndSet(false, true)) {
if (client != null) {
client.close();
}
}
}
}