All downloads are FREE. Search and download functionality uses the official Maven repository.

org.apache.hadoop.fs.s3a.Constants Maven / Gradle / Ivy

Go to download

This module contains code to support integration with Amazon Web Services. It also declares the dependencies needed to work with AWS services.

The newest version!
/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.hadoop.fs.s3a;

import org.apache.hadoop.classification.InterfaceAudience;
import org.apache.hadoop.classification.InterfaceStability;

/**
 * All the constants used with the {@link S3AFileSystem}.
 *
 * Some of the strings are marked as {@code Unstable}. This means
 * that they may be unsupported in future; at which point they will be marked
 * as deprecated and simply ignored.
 */
@InterfaceAudience.Public
@InterfaceStability.Evolving
public final class Constants {

  private Constants() {
  }

  /**
   * default hadoop temp dir on local system: {@value}.
   */
  public static final String HADOOP_TMP_DIR = "hadoop.tmp.dir";

  /** The minimum multipart size which S3 supports. */
  public static final int MULTIPART_MIN_SIZE = 5 * 1024 * 1024;

  // s3 access key
  public static final String ACCESS_KEY = "fs.s3a.access.key";

  // s3 secret key
  public static final String SECRET_KEY = "fs.s3a.secret.key";

  // aws credentials provider
  public static final String AWS_CREDENTIALS_PROVIDER =
      "fs.s3a.aws.credentials.provider";

  /**
   * Extra set of security credentials which will be prepended to that
   * set in {@code "hadoop.security.credential.provider.path"}.
   * This extra option allows for per-bucket overrides.
   */
  public static final String S3A_SECURITY_CREDENTIAL_PROVIDER_PATH =
      "fs.s3a.security.credential.provider.path";

  // session token for when using TemporaryAWSCredentialsProvider
  public static final String SESSION_TOKEN = "fs.s3a.session.token";

  /**
   * AWS Role to request.
   */
  public static final String ASSUMED_ROLE_ARN =
      "fs.s3a.assumed.role.arn";

  /**
   * Session name for the assumed role, must be valid characters according
   * to the AWS APIs.
   * If not set, one is generated from the current Hadoop/Kerberos username.
   */
  public static final String ASSUMED_ROLE_SESSION_NAME =
      "fs.s3a.assumed.role.session.name";

  /**
   * Duration of assumed roles before a refresh is attempted.
   */
  public static final String ASSUMED_ROLE_SESSION_DURATION =
      "fs.s3a.assumed.role.session.duration";

  /** Security Token Service Endpoint. If unset, uses the default endpoint. */
  public static final String ASSUMED_ROLE_STS_ENDPOINT =
      "fs.s3a.assumed.role.sts.endpoint";

  /**
   * Region for the STS endpoint; only relevant if the endpoint
   * is set.
   */
  public static final String ASSUMED_ROLE_STS_ENDPOINT_REGION =
      "fs.s3a.assumed.role.sts.endpoint.region";

  /**
   * Default value for the STS endpoint region; needed for
   * v4 signing.
   */
  public static final String ASSUMED_ROLE_STS_ENDPOINT_REGION_DEFAULT =
      "us-west-1";

  /**
   * Default duration of an assumed role.
   */
  public static final String ASSUMED_ROLE_SESSION_DURATION_DEFAULT = "30m";

  /** list of providers to authenticate for the assumed role. */
  public static final String ASSUMED_ROLE_CREDENTIALS_PROVIDER =
      "fs.s3a.assumed.role.credentials.provider";

  /** JSON policy containing the policy to apply to the role. */
  public static final String ASSUMED_ROLE_POLICY =
      "fs.s3a.assumed.role.policy";

  public static final String ASSUMED_ROLE_CREDENTIALS_DEFAULT =
      SimpleAWSCredentialsProvider.NAME;

  // number of simultaneous connections to s3
  public static final String MAXIMUM_CONNECTIONS = "fs.s3a.connection.maximum";
  public static final int DEFAULT_MAXIMUM_CONNECTIONS = 15;

  // connect to s3 over ssl?
  public static final String SECURE_CONNECTIONS =
      "fs.s3a.connection.ssl.enabled";
  public static final boolean DEFAULT_SECURE_CONNECTIONS = true;

  //use a custom endpoint?
  public static final String ENDPOINT = "fs.s3a.endpoint";

  //Enable path style access? Overrides default virtual hosting
  public static final String PATH_STYLE_ACCESS = "fs.s3a.path.style.access";

  //connect to s3 through a proxy server?
  public static final String PROXY_HOST = "fs.s3a.proxy.host";
  public static final String PROXY_PORT = "fs.s3a.proxy.port";
  public static final String PROXY_USERNAME = "fs.s3a.proxy.username";
  public static final String PROXY_PASSWORD = "fs.s3a.proxy.password";
  public static final String PROXY_DOMAIN = "fs.s3a.proxy.domain";
  public static final String PROXY_WORKSTATION = "fs.s3a.proxy.workstation";

  // number of times we should retry errors
  public static final String MAX_ERROR_RETRIES = "fs.s3a.attempts.maximum";
  public static final int DEFAULT_MAX_ERROR_RETRIES = 20;

  // seconds until we give up trying to establish a connection to s3
  public static final String ESTABLISH_TIMEOUT =
      "fs.s3a.connection.establish.timeout";
  public static final int DEFAULT_ESTABLISH_TIMEOUT = 50000;

  // seconds until we give up on a connection to s3
  public static final String SOCKET_TIMEOUT = "fs.s3a.connection.timeout";
  public static final int DEFAULT_SOCKET_TIMEOUT = 200000;

  // socket send buffer to be used in Amazon client
  public static final String SOCKET_SEND_BUFFER = "fs.s3a.socket.send.buffer";
  public static final int DEFAULT_SOCKET_SEND_BUFFER = 8 * 1024;

  // socket send buffer to be used in Amazon client
  public static final String SOCKET_RECV_BUFFER = "fs.s3a.socket.recv.buffer";
  public static final int DEFAULT_SOCKET_RECV_BUFFER = 8 * 1024;

  // number of records to get while paging through a directory listing
  public static final String MAX_PAGING_KEYS = "fs.s3a.paging.maximum";
  public static final int DEFAULT_MAX_PAGING_KEYS = 5000;

  // the maximum number of threads to allow in the pool used by TransferManager
  public static final String MAX_THREADS = "fs.s3a.threads.max";
  public static final int DEFAULT_MAX_THREADS = 10;

  // the time an idle thread waits before terminating
  public static final String KEEPALIVE_TIME = "fs.s3a.threads.keepalivetime";
  public static final int DEFAULT_KEEPALIVE_TIME = 60;

  // the maximum number of tasks cached if all threads are already uploading
  public static final String MAX_TOTAL_TASKS = "fs.s3a.max.total.tasks";
  public static final int DEFAULT_MAX_TOTAL_TASKS = 5;

  // size of each of or multipart pieces in bytes
  public static final String MULTIPART_SIZE = "fs.s3a.multipart.size";
  public static final long DEFAULT_MULTIPART_SIZE = 104857600; // 100 MB

  // minimum size in bytes before we start a multipart uploads or copy
  public static final String MIN_MULTIPART_THRESHOLD =
      "fs.s3a.multipart.threshold";
  public static final long DEFAULT_MIN_MULTIPART_THRESHOLD = Integer.MAX_VALUE;

  //enable multiobject-delete calls?
  public static final String ENABLE_MULTI_DELETE =
      "fs.s3a.multiobjectdelete.enable";

  // comma separated list of directories
  public static final String BUFFER_DIR = "fs.s3a.buffer.dir";

  // switch to the fast block-by-block upload mechanism
  // this is the only supported upload mechanism
  @Deprecated
  public static final String FAST_UPLOAD = "fs.s3a.fast.upload";
  @Deprecated
  public static final boolean DEFAULT_FAST_UPLOAD = false;

  //initial size of memory buffer for a fast upload
  @Deprecated
  public static final String FAST_BUFFER_SIZE = "fs.s3a.fast.buffer.size";
  public static final int DEFAULT_FAST_BUFFER_SIZE = 1048576; //1MB

  /**
   * What buffer to use.
   * Default is {@link #FAST_UPLOAD_BUFFER_DISK}
   * Value: {@value}
   */
  @InterfaceStability.Unstable
  public static final String FAST_UPLOAD_BUFFER =
      "fs.s3a.fast.upload.buffer";

  /**
   * Buffer blocks to disk: {@value}.
   * Capacity is limited to available disk space.
   */

  @InterfaceStability.Unstable
  public static final String FAST_UPLOAD_BUFFER_DISK = "disk";

  /**
   * Use an in-memory array. Fast but will run of heap rapidly: {@value}.
   */
  @InterfaceStability.Unstable
  public static final String FAST_UPLOAD_BUFFER_ARRAY = "array";

  /**
   * Use a byte buffer. May be more memory efficient than the
   * {@link #FAST_UPLOAD_BUFFER_ARRAY}: {@value}.
   */
  @InterfaceStability.Unstable
  public static final String FAST_UPLOAD_BYTEBUFFER = "bytebuffer";

  /**
   * Default buffer option: {@value}.
   */
  @InterfaceStability.Unstable
  public static final String DEFAULT_FAST_UPLOAD_BUFFER =
      FAST_UPLOAD_BUFFER_DISK;

  /**
   * Maximum Number of blocks a single output stream can have
   * active (uploading, or queued to the central FileSystem
   * instance's pool of queued operations.
   * This stops a single stream overloading the shared thread pool.
   * {@value}
   * 

* Default is {@link #DEFAULT_FAST_UPLOAD_ACTIVE_BLOCKS} */ @InterfaceStability.Unstable public static final String FAST_UPLOAD_ACTIVE_BLOCKS = "fs.s3a.fast.upload.active.blocks"; /** * Limit of queued block upload operations before writes * block. Value: {@value} */ @InterfaceStability.Unstable public static final int DEFAULT_FAST_UPLOAD_ACTIVE_BLOCKS = 4; // Private | PublicRead | PublicReadWrite | AuthenticatedRead | // LogDeliveryWrite | BucketOwnerRead | BucketOwnerFullControl public static final String CANNED_ACL = "fs.s3a.acl.default"; public static final String DEFAULT_CANNED_ACL = ""; // should we try to purge old multipart uploads when starting up public static final String PURGE_EXISTING_MULTIPART = "fs.s3a.multipart.purge"; public static final boolean DEFAULT_PURGE_EXISTING_MULTIPART = false; // purge any multipart uploads older than this number of seconds public static final String PURGE_EXISTING_MULTIPART_AGE = "fs.s3a.multipart.purge.age"; public static final long DEFAULT_PURGE_EXISTING_MULTIPART_AGE = 86400; // s3 server-side encryption, see S3AEncryptionMethods for valid options public static final String SERVER_SIDE_ENCRYPTION_ALGORITHM = "fs.s3a.server-side-encryption-algorithm"; /** * The standard encryption algorithm AWS supports. * Different implementations may support others (or none). * Use the S3AEncryptionMethods instead when configuring * which Server Side Encryption to use. * Value: "{@value}". */ @Deprecated public static final String SERVER_SIDE_ENCRYPTION_AES256 = "AES256"; /** * Used to specify which AWS KMS key to use if * {@link #SERVER_SIDE_ENCRYPTION_ALGORITHM} is * {@code SSE-KMS} (will default to aws/s3 * master key if left blank). * With with {@code SSE_C}, the base-64 encoded AES 256 key. * May be set within a JCEKS file. * Value: "{@value}". 
*/ public static final String SERVER_SIDE_ENCRYPTION_KEY = "fs.s3a.server-side-encryption.key"; //override signature algorithm used for signing requests public static final String SIGNING_ALGORITHM = "fs.s3a.signing-algorithm"; public static final String S3N_FOLDER_SUFFIX = "_$folder$"; public static final String FS_S3A_BLOCK_SIZE = "fs.s3a.block.size"; public static final String FS_S3A = "s3a"; /** Prefix for all S3A properties: {@value}. */ public static final String FS_S3A_PREFIX = "fs.s3a."; /** Prefix for S3A bucket-specific properties: {@value}. */ public static final String FS_S3A_BUCKET_PREFIX = "fs.s3a.bucket."; public static final int S3A_DEFAULT_PORT = -1; public static final String USER_AGENT_PREFIX = "fs.s3a.user.agent.prefix"; /** Whether or not to allow MetadataStore to be source of truth. */ public static final String METADATASTORE_AUTHORITATIVE = "fs.s3a.metadatastore.authoritative"; public static final boolean DEFAULT_METADATASTORE_AUTHORITATIVE = false; /** read ahead buffer size to prevent connection re-establishments. */ public static final String READAHEAD_RANGE = "fs.s3a.readahead.range"; public static final long DEFAULT_READAHEAD_RANGE = 64 * 1024; /** * Which input strategy to use for buffering, seeking and similar when * reading data. * Value: {@value} */ @InterfaceStability.Unstable public static final String INPUT_FADVISE = "fs.s3a.experimental.input.fadvise"; /** * General input. Some seeks, some reads. * Value: {@value} */ @InterfaceStability.Unstable public static final String INPUT_FADV_NORMAL = "normal"; /** * Optimized for sequential access. * Value: {@value} */ @InterfaceStability.Unstable public static final String INPUT_FADV_SEQUENTIAL = "sequential"; /** * Optimized purely for random seek+read/positionedRead operations; * The performance of sequential IO may be reduced in exchange for * more efficient {@code seek()} operations. 
* Value: {@value} */ @InterfaceStability.Unstable public static final String INPUT_FADV_RANDOM = "random"; @InterfaceAudience.Private @InterfaceStability.Unstable public static final String S3_CLIENT_FACTORY_IMPL = "fs.s3a.s3.client.factory.impl"; @InterfaceAudience.Private @InterfaceStability.Unstable public static final Class DEFAULT_S3_CLIENT_FACTORY_IMPL = DefaultS3ClientFactory.class; /** * Maximum number of partitions in a multipart upload: {@value}. */ @InterfaceAudience.Private public static final int MAX_MULTIPART_COUNT = 10000; /* Constants. */ public static final String S3_METADATA_STORE_IMPL = "fs.s3a.metadatastore.impl"; /** Minimum period of time (in milliseconds) to keep metadata (may only be * applied when a prune command is manually run). */ @InterfaceStability.Unstable public static final String S3GUARD_CLI_PRUNE_AGE = "fs.s3a.s3guard.cli.prune.age"; /** * The region of the DynamoDB service. * * This config has no default value. If the user does not set this, the * S3Guard will operate table in the associated S3 bucket region. */ @InterfaceStability.Unstable public static final String S3GUARD_DDB_REGION_KEY = "fs.s3a.s3guard.ddb.region"; /** * The DynamoDB table name to use. * * This config has no default value. If the user does not set this, the * S3Guard implementation will use the respective S3 bucket name. */ @InterfaceStability.Unstable public static final String S3GUARD_DDB_TABLE_NAME_KEY = "fs.s3a.s3guard.ddb.table"; /** * A prefix for adding tags to the DDB Table upon creation. * * For example: * fs.s3a.s3guard.ddb.table.tag.mytag */ @InterfaceStability.Unstable public static final String S3GUARD_DDB_TABLE_TAG = "fs.s3a.s3guard.ddb.table.tag."; /** * Test table name to use during DynamoDB integration test. * * The table will be modified, and deleted in the end of the tests. * If this value is not set, the integration tests that would be destructive * won't run. 
*/ @InterfaceStability.Unstable public static final String S3GUARD_DDB_TEST_TABLE_NAME_KEY = "fs.s3a.s3guard.ddb.test.table"; /** * Whether to create the DynamoDB table if the table does not exist. */ @InterfaceStability.Unstable public static final String S3GUARD_DDB_TABLE_CREATE_KEY = "fs.s3a.s3guard.ddb.table.create"; @InterfaceStability.Unstable public static final String S3GUARD_DDB_TABLE_CAPACITY_READ_KEY = "fs.s3a.s3guard.ddb.table.capacity.read"; public static final long S3GUARD_DDB_TABLE_CAPACITY_READ_DEFAULT = 500; @InterfaceStability.Unstable public static final String S3GUARD_DDB_TABLE_CAPACITY_WRITE_KEY = "fs.s3a.s3guard.ddb.table.capacity.write"; public static final long S3GUARD_DDB_TABLE_CAPACITY_WRITE_DEFAULT = 100; /** * The maximum put or delete requests per BatchWriteItem request. * * Refer to Amazon API reference for this limit. */ public static final int S3GUARD_DDB_BATCH_WRITE_REQUEST_LIMIT = 25; @InterfaceStability.Unstable public static final String S3GUARD_DDB_MAX_RETRIES = "fs.s3a.s3guard.ddb.max.retries"; /** * Max retries on batched/throttled DynamoDB operations before giving up and * throwing an IOException. Default is {@value}. See core-default.xml for * more detail. */ public static final int S3GUARD_DDB_MAX_RETRIES_DEFAULT = DEFAULT_MAX_ERROR_RETRIES; @InterfaceStability.Unstable public static final String S3GUARD_DDB_THROTTLE_RETRY_INTERVAL = "fs.s3a.s3guard.ddb.throttle.retry.interval"; public static final String S3GUARD_DDB_THROTTLE_RETRY_INTERVAL_DEFAULT = "100ms"; /** * Period of time (in milliseconds) to sleep between batches of writes. * Currently only applies to prune operations, as they are naturally a * lower priority than other operations. */ @InterfaceStability.Unstable public static final String S3GUARD_DDB_BACKGROUND_SLEEP_MSEC_KEY = "fs.s3a.s3guard.ddb.background.sleep"; public static final int S3GUARD_DDB_BACKGROUND_SLEEP_MSEC_DEFAULT = 25; /** * The default "Null" metadata store: {@value}. 
*/ @InterfaceStability.Unstable public static final String S3GUARD_METASTORE_NULL = "org.apache.hadoop.fs.s3a.s3guard.NullMetadataStore"; /** * Use Local memory for the metadata: {@value}. * This is not coherent across processes and must be used for testing only. */ @InterfaceStability.Unstable public static final String S3GUARD_METASTORE_LOCAL = "org.apache.hadoop.fs.s3a.s3guard.LocalMetadataStore"; /** * Maximum number of records in LocalMetadataStore. */ @InterfaceStability.Unstable public static final String S3GUARD_METASTORE_LOCAL_MAX_RECORDS = "fs.s3a.s3guard.local.max_records"; public static final int DEFAULT_S3GUARD_METASTORE_LOCAL_MAX_RECORDS = 256; /** * Time to live in milliseconds in LocalMetadataStore. * If zero, time-based expiration is disabled. */ @InterfaceStability.Unstable public static final String S3GUARD_METASTORE_LOCAL_ENTRY_TTL = "fs.s3a.s3guard.local.ttl"; public static final int DEFAULT_S3GUARD_METASTORE_LOCAL_ENTRY_TTL = 10 * 1000; /** * Use DynamoDB for the metadata: {@value}. */ @InterfaceStability.Unstable public static final String S3GUARD_METASTORE_DYNAMO = "org.apache.hadoop.fs.s3a.s3guard.DynamoDBMetadataStore"; /** * Inconsistency (visibility delay) injection settings. */ @InterfaceStability.Unstable public static final String FAIL_INJECT_INCONSISTENCY_KEY = "fs.s3a.failinject.inconsistency.key.substring"; @InterfaceStability.Unstable public static final String FAIL_INJECT_INCONSISTENCY_MSEC = "fs.s3a.failinject.inconsistency.msec"; @InterfaceStability.Unstable public static final String FAIL_INJECT_INCONSISTENCY_PROBABILITY = "fs.s3a.failinject.inconsistency.probability"; /** * S3 API level parameters. 
*/ @InterfaceStability.Unstable public static final String LIST_VERSION = "fs.s3a.list.version"; @InterfaceStability.Unstable public static final int DEFAULT_LIST_VERSION = 2; @InterfaceStability.Unstable public static final String FAIL_INJECT_THROTTLE_PROBABILITY = "fs.s3a.failinject.throttle.probability"; @InterfaceStability.Unstable public static final String FAIL_INJECT_CLIENT_FACTORY = "org.apache.hadoop.fs.s3a.InconsistentS3ClientFactory"; /** * Number of times to retry any repeatable S3 client request on failure, * excluding throttling requests: {@value}. */ public static final String RETRY_LIMIT = "fs.s3a.retry.limit"; /** * Default retry limit: {@value}. */ public static final int RETRY_LIMIT_DEFAULT = DEFAULT_MAX_ERROR_RETRIES; /** * Interval between retry attempts.: {@value}. */ public static final String RETRY_INTERVAL = "fs.s3a.retry.interval"; /** * Default retry interval: {@value}. */ public static final String RETRY_INTERVAL_DEFAULT = "500ms"; /** * Number of times to retry any throttled request: {@value}. */ public static final String RETRY_THROTTLE_LIMIT = "fs.s3a.retry.throttle.limit"; /** * Default throttled retry limit: {@value}. */ public static final int RETRY_THROTTLE_LIMIT_DEFAULT = DEFAULT_MAX_ERROR_RETRIES; /** * Interval between retry attempts on throttled requests: {@value}. */ public static final String RETRY_THROTTLE_INTERVAL = "fs.s3a.retry.throttle.interval"; /** * Default throttled retry interval: {@value}. */ public static final String RETRY_THROTTLE_INTERVAL_DEFAULT = "500ms"; /** * Should etags be exposed as checksums? */ public static final String ETAG_CHECKSUM_ENABLED = "fs.s3a.etag.checksum.enabled"; /** * Default value: false. */ public static final boolean ETAG_CHECKSUM_ENABLED_DEFAULT = false; /** * Where to get the value to use in change detection. E.g. eTag, or * versionId? */ public static final String CHANGE_DETECT_SOURCE = "fs.s3a.change.detection.source"; /** * eTag as the change detection mechanism. 
*/ public static final String CHANGE_DETECT_SOURCE_ETAG = "etag"; /** * Object versionId as the change detection mechanism. */ public static final String CHANGE_DETECT_SOURCE_VERSION_ID = "versionid"; /** * Default change detection mechanism: eTag. */ public static final String CHANGE_DETECT_SOURCE_DEFAULT = CHANGE_DETECT_SOURCE_ETAG; /** * Mode to run change detection in. Server side comparison? Client side * comparison? Client side compare and warn rather than exception? Don't * bother at all? */ public static final String CHANGE_DETECT_MODE = "fs.s3a.change.detection.mode"; /** * Change is detected on the client side by comparing the returned id with the * expected id. A difference results in {@link RemoteFileChangedException}. */ public static final String CHANGE_DETECT_MODE_CLIENT = "client"; /** * Change is detected by passing the expected value in the GetObject request. * If the expected value is unavailable, {@link RemoteFileChangedException} is * thrown. */ public static final String CHANGE_DETECT_MODE_SERVER = "server"; /** * Change is detected on the client side by comparing the returned id with the * expected id. A difference results in a WARN level message being logged. */ public static final String CHANGE_DETECT_MODE_WARN = "warn"; /** * Change detection is turned off. Readers may see inconsistent results due * to concurrent writes without any exception or warning messages. May be * useful with third-party S3 API implementations that don't support one of * the change detection modes. */ public static final String CHANGE_DETECT_MODE_NONE = "none"; /** * Default change detection mode: server. */ public static final String CHANGE_DETECT_MODE_DEFAULT = CHANGE_DETECT_MODE_SERVER; /** * If true, raises a {@link RemoteFileChangedException} exception when S3 * doesn't provide the attribute defined by fs.s3a.change.detection.source. 
* For example, if source is versionId, but object versioning is not enabled * on the bucket, or alternatively if source is eTag and a third-party S3 * implementation that doesn't return eTag is used. *

* When false, only a warning message will be logged for this condition. */ public static final String CHANGE_DETECT_REQUIRE_VERSION = "fs.s3a.change.detection.version.required"; /** * Default change detection require version: true. */ public static final boolean CHANGE_DETECT_REQUIRE_VERSION_DEFAULT = true; }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy