All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.iceberg.aws.s3.S3FileIO Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.apache.iceberg.aws.s3;

import java.util.Map;
import java.util.concurrent.atomic.AtomicBoolean;
import org.apache.iceberg.aws.AwsClientFactories;
import org.apache.iceberg.aws.AwsClientFactory;
import org.apache.iceberg.aws.AwsProperties;
import org.apache.iceberg.io.FileIO;
import org.apache.iceberg.io.InputFile;
import org.apache.iceberg.io.OutputFile;
import org.apache.iceberg.util.SerializableSupplier;
import software.amazon.awssdk.services.s3.S3Client;
import software.amazon.awssdk.services.s3.model.DeleteObjectRequest;

/**
 * FileIO implementation backed by S3.
 * 

* Locations used must follow the conventions for S3 URIs (e.g. s3://bucket/path...). * URIs with schemes s3a, s3n, https are also treated as s3 file paths. * Using this FileIO with other schemes will result in {@link org.apache.iceberg.exceptions.ValidationException}. */ public class S3FileIO implements FileIO { private SerializableSupplier s3; private AwsProperties awsProperties; private AwsClientFactory awsClientFactory; private transient S3Client client; private final AtomicBoolean isResourceClosed = new AtomicBoolean(false); /** * No-arg constructor to load the FileIO dynamically. *

* All fields are initialized by calling {@link S3FileIO#initialize(Map)} later. */ public S3FileIO() { } /** * Constructor with custom s3 supplier and default AWS properties. *

* Calling {@link S3FileIO#initialize(Map)} will overwrite information set in this constructor. * @param s3 s3 supplier */ public S3FileIO(SerializableSupplier s3) { this(s3, new AwsProperties()); } /** * Constructor with custom s3 supplier and AWS properties. *

* Calling {@link S3FileIO#initialize(Map)} will overwrite information set in this constructor. * @param s3 s3 supplier * @param awsProperties aws properties */ public S3FileIO(SerializableSupplier s3, AwsProperties awsProperties) { this.s3 = s3; this.awsProperties = awsProperties; } @Override public InputFile newInputFile(String path) { return S3InputFile.fromLocation(path, client(), awsProperties); } @Override public OutputFile newOutputFile(String path) { return S3OutputFile.fromLocation(path, client(), awsProperties); } @Override public void deleteFile(String path) { S3URI location = new S3URI(path); DeleteObjectRequest deleteRequest = DeleteObjectRequest.builder().bucket(location.bucket()).key(location.key()).build(); client().deleteObject(deleteRequest); } private S3Client client() { if (client == null) { client = s3.get(); } return client; } @Override public void initialize(Map properties) { this.awsProperties = new AwsProperties(properties); this.awsClientFactory = AwsClientFactories.from(properties); this.s3 = awsClientFactory::s3; } @Override public void close() { // handles concurrent calls to close() if (isResourceClosed.compareAndSet(false, true)) { if (client != null) { client.close(); } } } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy