Maven / Gradle / Ivy
Show all versions of gcs-connector Show documentation
/*
 * Copyright 2014 Google Inc. All Rights Reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except
 * in compliance with the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software distributed under the
 * License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
 * express or implied. See the License for the specific language governing permissions and
 * limitations under the License.
 */
import java.util.EnumSet;
import java.util.StringTokenizer;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.AbstractFileSystem;
import org.apache.hadoop.fs.BlockLocation;
import org.apache.hadoop.fs.CreateFlag;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileChecksum;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FsServerDefaults;
import org.apache.hadoop.fs.FsStatus;
import org.apache.hadoop.fs.Options.ChecksumOpt;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.permission.FsPermission;
import org.apache.hadoop.util.Progressable;
/**
 * GoogleHadoopFS provides a YARN compatible Abstract File System on top of Google Cloud Storage
 * (GCS).
 *
 * <p>It is implemented as a thin abstraction layer on top of GoogleHadoopFileSystem, but will soon
 * be refactored to share a common base.
 */
public class GoogleHadoopFS extends AbstractFileSystem {
// Class-wide logger used to trace the calls made through this adapter.
private static final GoogleLogger logger = GoogleLogger.forEnclosingClass();
// Wrapped GoogleHadoopFileSystem instance; the methods of this class delegate to it.
private GoogleHadoopFileSystem ghfs;
/**
 * Creates a GoogleHadoopFS backed by a newly constructed {@link GoogleHadoopFileSystem}.
 *
 * @param uri URI handed on to the three-argument constructor
 * @param conf configuration handed on to the three-argument constructor
 * @throws URISyntaxException propagated from the three-argument constructor
 * @throws IOException propagated from the three-argument constructor
 */
public GoogleHadoopFS(URI uri, Configuration conf) throws URISyntaxException, IOException {
  this(new GoogleHadoopFileSystem(), uri, conf);
}
/**
 * Creates a GoogleHadoopFS that wraps the given file system and initializes it with the given
 * URI and configuration.
 *
 * @param ghfs file system to wrap; must not be null
 * @param uri URI passed to the AbstractFileSystem constructor and to {@code ghfs.initialize}
 * @param conf configuration passed to {@code ghfs.initialize}
 * @throws NullPointerException if {@code ghfs} is null
 * @throws URISyntaxException declared for the AbstractFileSystem constructor call
 * @throws IOException declared for the call to {@code ghfs.initialize}
 */
public GoogleHadoopFS(GoogleHadoopFileSystem ghfs, URI uri, Configuration conf)
    throws URISyntaxException, IOException {
  // AbstractFileSystem requires authority based AbstractFileSystems to have valid ports.
  // true == GoogleHadoopFS requires authorities in URIs.
  // 0 == the fake port passed to AbstractFileSystem.
  // The null check lives inside the super(...) argument list because ghfs is dereferenced
  // there; a check placed after the call could never be reached with a null ghfs.
  super(uri, Preconditions.checkNotNull(ghfs, "ghfs must not be null").getScheme(), true, 0);
  this.ghfs = ghfs;
  ghfs.initialize(uri, conf);
}
public FSDataOutputStream createInternal(
Path file,
EnumSet flag,
FsPermission absolutePermission,
int bufferSize,
short replication,
long blockSize,
Progressable progress,
ChecksumOpt checksumOpt,
boolean createParent)
throws IOException {
"createInternal(file: %s, flag: %s, absolutePermission: %s, bufferSize: %d, "
+ "replication: %b, blockSize: %d, progress: %s, checksumOpt: %s, createParent: %b)",
if (!createParent) {
// TODO: don't ignore 'createParent' flag
logger.atFine().log("Ignoring createParent=false. Creating parents anyways.");
// AbstractFileSystems rely on permission to not overwrite.
boolean overwriteFile = true;
return ghfs.create(
file, absolutePermission, overwriteFile, bufferSize, replication, blockSize, progress);
public int getUriDefaultPort() {
int defaultPort = ghfs.getDefaultPort();
logger.atFiner().log("getUriDefaultPort(): %d", defaultPort);
return defaultPort;
* This is overridden to use GoogleHadoopFileSystem's URI, because AbstractFileSystem appends the
* default port to the authority.
public URI getUri() {
return ghfs.getUri();
/** Follow HDFS conventions except allow for ':' in paths. */
public boolean isValidName(String src) {
StringTokenizer tokens = new StringTokenizer(src, Path.SEPARATOR);
while (tokens.hasMoreTokens()) {
String element = tokens.nextToken();
if (element.equals("..") || element.equals(".")) {
return false;
return true;
/** Only accept valid AbstractFileSystem and GoogleHadoopFileSystem Paths. */
public void checkPath(Path path) {
// TODO: Implement GoogleHadoopFileSystemBase.getServerDefaults(Path)
public FsServerDefaults getServerDefaults() throws IOException {
return ghfs.getServerDefaults();
public void mkdir(final Path dir, final FsPermission permission, final boolean createParent)
throws IOException {
"mkdir(dir: %s, permission: %s, createParent %b)", dir, permission, createParent);
if (!createParent) {
logger.atFine().log("Ignoring createParent=false. Creating parents anyways.");
ghfs.mkdirs(dir, permission);
public boolean delete(final Path f, final boolean recursive) throws IOException {
logger.atFiner().log("delete(path: %s, recursive: %b)", f, recursive);
return ghfs.delete(f, recursive);
public FSDataInputStream open(final Path f, int bufferSize) throws IOException {
logger.atFiner().log("open(path: %s, bufferSize: %d)", f, bufferSize);
return, bufferSize);
public boolean setReplication(final Path f, final short replication) throws IOException {
logger.atFiner().log("setReplication(path: %s, replication: %d)", f, replication);
return ghfs.setReplication(f, replication);
public void renameInternal(final Path src, final Path dst) throws IOException {
logger.atFiner().log("renameInternal(src: %s, dst: %s)", src, dst);
ghfs.renameInternal(src, dst);
public void setPermission(final Path f, final FsPermission permission) throws IOException {
logger.atFiner().log("setPermission(path: %s, permission: %s)", f, permission);
ghfs.setPermission(f, permission);
public void setOwner(final Path f, final String username, final String groupname)
throws IOException {
logger.atFiner().log("setOwner(path: %s, username: %s, groupname: %s)", f, username, groupname);
ghfs.setOwner(f, username, groupname);
public void setTimes(final Path f, final long mtime, final long atime) throws IOException {
logger.atFiner().log("setTimes(path: %s, mtime: %d, atime: %d)", f, mtime, atime);
ghfs.setTimes(f, mtime, atime);
public FileChecksum getFileChecksum(final Path f) throws IOException {
logger.atFiner().log("getFileChecksum(path: %s)", f);
return ghfs.getFileChecksum(f);
public FileStatus getFileStatus(final Path f) throws IOException {
logger.atFiner().log("getFileStatus(path: %s)", f);
return ghfs.getFileStatus(f);
public BlockLocation[] getFileBlockLocations(final Path f, final long start, final long len)
throws IOException {
logger.atFiner().log("getFileBlockLocations(path: %s, start: %d, len: %d)", f, start, len);
return ghfs.getFileBlockLocations(f, start, len);
public FsStatus getFsStatus() throws IOException {
return ghfs.getStatus();
public FileStatus[] listStatus(final Path f) throws IOException {
logger.atFiner().log("listStatus(path: %s)", f);
return ghfs.listStatus(f);
public void setVerifyChecksum(final boolean verifyChecksum) {
logger.atFiner().log("setVerifyChecksum(verifyChecksum: %b)", verifyChecksum);