All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.qcloud.chdfs.fs.CHDFSHadoopFileSystemAdapter Maven / Gradle / Ivy

There is a newer version: 3.5
Show newest version
package com.qcloud.chdfs.fs;

import org.apache.commons.io.IOUtils;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.ContentSummary;
import org.apache.hadoop.fs.CreateFlag;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileAlreadyExistsException;
import org.apache.hadoop.fs.FileChecksum;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FsStatus;
import org.apache.hadoop.fs.ParentNotDirectoryException;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.UnsupportedFileSystemException;
import org.apache.hadoop.fs.XAttrSetFlag;
import org.apache.hadoop.fs.permission.AclEntry;
import org.apache.hadoop.fs.permission.AclStatus;
import org.apache.hadoop.fs.permission.FsPermission;
import org.apache.hadoop.security.AccessControlException;
import org.apache.hadoop.security.token.Token;
import org.apache.hadoop.util.Progressable;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.io.File;
import java.io.FileNotFoundException;
import java.io.IOException;
import java.io.InputStream;
import java.net.URI;
import java.util.EnumSet;
import java.util.List;
import java.util.Map;
import java.util.Properties;
import java.util.concurrent.ThreadLocalRandom;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

public class CHDFSHadoopFileSystemAdapter extends FileSystemWithLockCleaner {
    static final String SCHEME = "ofs";
    private static final Logger log = LoggerFactory.getLogger(CHDFSHadoopFileSystemAdapter.class);
    private static final String MOUNT_POINT_ADDR_PATTERN_CHDFS_TYPE =
            "^([a-zA-Z0-9-]+)\\.chdfs(-dualstack)?(\\.inner)?\\.([a-z0-9-]+)\\.([a-z0-9-.]+)";
    private static final String MOUNT_POINT_ADDR_PATTERN_COS_TYPE =
            "^([a-z0-9-]+)-([a-zA-Z0-9]+)$";
    private static final String CHDFS_USER_APPID_KEY = "fs.ofs.user.appid";
    private static final String CHDFS_TMP_CACHE_DIR_KEY = "fs.ofs.tmp.cache.dir";
    private static final String CHDFS_META_SERVER_PORT_KEY = "fs.ofs.meta.server.port";
    private static final String CHDFS_META_TRANSFER_USE_TLS_KEY = "fs.ofs.meta.transfer.tls";
    private static final String CHDFS_BUCKET_REGION = "fs.ofs.bucket.region";
    private static final String COS_ENDPOINT_SUFFIX = "fs.ofs.data.transfer.endpoint.suffix";

    private static final String CHDFS_META_ENDPOINT_SUFFIX_KEY = "fs.ofs.meta.endpoint.suffix";
    private static final boolean DEFAULT_CHDFS_META_TRANSFER_USE_TLS = true;
    private static final int DEFAULT_CHDFS_META_SERVER_PORT = 443;

    public static final String CHDFS_DATA_TRANSFER_DISTINGUISH_HOST = "fs.ofs.data.transfer.distinguish.host";

    public static final boolean DEFAULT_CHDFS_DATA_TRANSFER_DISTINGUISH_FLAG = false;

    private final CHDFSHadoopFileSystemJarLoader jarLoader = new CHDFSHadoopFileSystemJarLoader();
    private FileSystemWithLockCleaner actualImplFS = null;
    private URI uri = null;
    private Path workingDir = null;
    private long initStartMs;

    @Override
    public String getScheme() {
        return CHDFSHadoopFileSystemAdapter.SCHEME;
    }

    @Override
    public void initialize(URI name, Configuration conf) throws IOException {
        log.debug("CHDFSHadoopFileSystemAdapter adapter initialize");
        this.initStartMs = System.currentTimeMillis();
        log.debug("CHDFSHadoopFileSystemAdapter start-init-start time: {}", initStartMs);
        try {
            super.initialize(name, conf);
            this.setConf(conf);
            String mountPointAddr = name.getHost();
            if (mountPointAddr == null) {
                String errMsg = String.format("mountPointAddr is null, fullUri: %s, exp. f4mabcdefgh-xyzw.chdfs"
                        + ".ap-guangzhou.myqcloud.com or examplebucket-1250000000 or f4mabcdefgh-xyzw", name.toString());
                log.error(errMsg);
                throw new IOException(errMsg);
            }

            String ofsHost;
            if (isValidMountPointAddrChdfsType(mountPointAddr)) {
                ofsHost = mountPointAddr;
            } else if (isValidMountPointAddrCosType(mountPointAddr)) {
                String metaEndpointSuffix = getMetaEndpointSuffix(conf);
                if (!metaEndpointSuffix.isEmpty()) {
                    ofsHost = mountPointAddr + "." + metaEndpointSuffix;
                    // force close tls
                    conf.setBoolean(CHDFS_META_TRANSFER_USE_TLS_KEY, false);
                } else {
                    String bucketRegion = getChdfsBucketRegion(conf);
                    ofsHost = String.format("%s.chdfs.%s.myqcloud.com", mountPointAddr, bucketRegion);
                }
            } else {
                String errMsg = String.format("mountPointAddr %s is invalid, fullUri: %s, exp. f4mabcdefgh-xyzw.chdfs"
                                + ".ap-guangzhou.myqcloud.com or examplebucket-1250000000 or f4mabcdefgh-xyzw",
                        mountPointAddr, name.toString());
                log.error(errMsg);
                throw new IOException(errMsg);
            }

            String networkVersionId = initPluginNetworkVersion();
            conf.set("chdfs.hadoop.plugin.network.version", String.format("network:%s", networkVersionId));

            long appid = getAppid(conf);
            int jarPluginServerPort = getJarPluginServerPort(conf);
            String tmpDirPath = initCacheTmpDir(conf);
            boolean jarPluginServerHttpsFlag = isJarPluginServerHttps(conf);
            String cosEndPointSuffix = getCosEndPointSuffix(conf);
            boolean distinguishHost = isDistinguishHost(conf);
            log.debug("fs.ofs.data.transfer.distinguish.host: {}", distinguishHost);
            initJarLoadWithRetry(ofsHost, appid, jarPluginServerPort, tmpDirPath, jarPluginServerHttpsFlag,
                    cosEndPointSuffix, distinguishHost, networkVersionId);

            this.actualImplFS = jarLoader.getActualFileSystem();
            if (this.actualImplFS == null) {
                // should never reach here
                throw new IOException("impl filesystem is null");
            }

            long actualInitStartMs = System.currentTimeMillis();
            this.actualImplFS.initialize(name, conf);
            log.debug("init actual file system, [elapse-ms: {}]", System.currentTimeMillis() - actualInitStartMs);
            this.uri = this.actualImplFS.getUri();
            this.workingDir = this.actualImplFS.getWorkingDirectory();
        } catch (IOException ioe) {
            log.error("initialize failed! a ioException occur!", ioe);
            throw ioe;
        } catch (Exception e) {
            log.error("initialize failed! a unexpected exception occur!", e);
            throw new IOException("initialize failed! oops! a unexpected exception occur! " + e.toString(), e);
        }
        log.debug("total init file system, [elapse-ms: {}]", System.currentTimeMillis() - initStartMs);
    }

    boolean isValidMountPointAddrChdfsType(String mountPointAddr) {
        return Pattern.matches(MOUNT_POINT_ADDR_PATTERN_CHDFS_TYPE, mountPointAddr);
    }

    boolean isValidMountPointAddrCosType(String mountPointAddr) {
        return Pattern.matches(MOUNT_POINT_ADDR_PATTERN_COS_TYPE, mountPointAddr);
    }

    private String getCosEndPointSuffix(Configuration conf) throws IOException {
        return conf.get(COS_ENDPOINT_SUFFIX);
    }

    private String getChdfsBucketRegion(Configuration conf) throws IOException {
        String bucketRegion = conf.get(CHDFS_BUCKET_REGION);
        if (bucketRegion == null) {
            String errMsg = String.format("ofs config %s is missing", CHDFS_BUCKET_REGION);
            log.error(errMsg);
            throw new IOException(errMsg);
        }
        return bucketRegion;
    }

    private String getMetaEndpointSuffix(Configuration conf) throws IOException {
        return initStringValue(conf, CHDFS_META_ENDPOINT_SUFFIX_KEY, "").toLowerCase();
    }

    private String initStringValue(Configuration conf, String configKey, String defaultValue)
            throws IOException {
        String retValue = conf.get(configKey);
        if (retValue == null) {
            if (defaultValue == null) {
                String errMsg = String.format("chdfs config %s missing", configKey);
                log.error(errMsg);
                throw new IOException(errMsg);
            } else {
                retValue = defaultValue;
                log.debug("chdfs config {} missing, use default value {}", configKey, defaultValue);
            }
        } else {
            if (retValue.trim().isEmpty()) {
                String errMsg = String.format("chdfs config %s value %s is invalid, value should not be empty string",
                        configKey, retValue);
                log.error(errMsg);
                throw new IOException(errMsg);
            }
        }
        return retValue.trim();
    }

    private long getAppid(Configuration conf) throws IOException {
        long appid = 0;
        try {
            appid = conf.getLong(CHDFS_USER_APPID_KEY, 0);
        } catch (NumberFormatException e) {
            throw new IOException(String.format("config for %s is invalid appid number", CHDFS_USER_APPID_KEY));
        }
        if (appid <= 0) {
            throw new IOException(
                    String.format("config for %s is missing or invalid appid number", CHDFS_USER_APPID_KEY));
        }
        return appid;
    }

    private int getJarPluginServerPort(Configuration conf) {
        return conf.getInt(CHDFS_META_SERVER_PORT_KEY, DEFAULT_CHDFS_META_SERVER_PORT);
    }

    private String initCacheTmpDir(Configuration conf) throws IOException {
        String chdfsTmpCacheDirPath = conf.get(CHDFS_TMP_CACHE_DIR_KEY);
        if (chdfsTmpCacheDirPath == null) {
            String errMsg = String.format("chdfs config %s is missing", CHDFS_TMP_CACHE_DIR_KEY);
            log.error(errMsg);
            throw new IOException(errMsg);
        }
        if (!chdfsTmpCacheDirPath.startsWith("/")) {
            String errMsg = String.format("chdfs config [%s: %s] must be absolute path", CHDFS_TMP_CACHE_DIR_KEY,
                    chdfsTmpCacheDirPath);
            log.error(errMsg);
            throw new IOException(errMsg);
        }

        File chdfsTmpCacheDir = new File(chdfsTmpCacheDirPath);
        if (!chdfsTmpCacheDir.exists()) {
            // judge exists again, may many map-reduce processes create cache dir parallel
            if (!chdfsTmpCacheDir.mkdirs() && !chdfsTmpCacheDir.exists()) {
                String errMsg = String.format("mkdir for chdfs tmp dir %s failed", chdfsTmpCacheDir.getAbsolutePath());
                log.error(errMsg);
                throw new IOException(errMsg);
            }
            chdfsTmpCacheDir.setReadable(true, false);
            chdfsTmpCacheDir.setWritable(true, false);
            chdfsTmpCacheDir.setExecutable(true, false);
        }

        if (!chdfsTmpCacheDir.isDirectory()) {
            String errMsg = String.format("chdfs config [%s: %s] is invalid directory", CHDFS_TMP_CACHE_DIR_KEY,
                    chdfsTmpCacheDir.getAbsolutePath());
            log.error(errMsg);
            throw new IOException(errMsg);
        }

        if (!chdfsTmpCacheDir.canRead()) {
            String errMsg = String.format("chdfs config [%s: %s] is not readable", CHDFS_TMP_CACHE_DIR_KEY,
                    chdfsTmpCacheDirPath);
            log.error(errMsg);
            throw new IOException(errMsg);
        }

        if (!chdfsTmpCacheDir.canWrite()) {
            String errMsg = String.format("chdfs config [%s: %s] is not writeable", CHDFS_TMP_CACHE_DIR_KEY,
                    chdfsTmpCacheDirPath);
            log.error(errMsg);
            throw new IOException(errMsg);
        }
        return chdfsTmpCacheDirPath;
    }

    private boolean isJarPluginServerHttps(Configuration conf) {
        return conf.getBoolean(CHDFS_META_TRANSFER_USE_TLS_KEY, DEFAULT_CHDFS_META_TRANSFER_USE_TLS);
    }

    private boolean isDistinguishHost(Configuration conf) {
        return conf.getBoolean(CHDFS_DATA_TRANSFER_DISTINGUISH_HOST, DEFAULT_CHDFS_DATA_TRANSFER_DISTINGUISH_FLAG);
    }


    private void initJarLoadWithRetry(String mountPointAddr, long appid, int jarPluginServerPort, String tmpDirPath,
                                      boolean jarPluginServerHttps, String cosEndPointSuffix, boolean distinguishHost
            , String networkVersionId) throws IOException {
        int maxRetry = 5;
        for (int retryIndex = 0; retryIndex <= maxRetry; retryIndex++) {
            try {
                jarLoader.init(mountPointAddr, appid, jarPluginServerPort, tmpDirPath, jarPluginServerHttps,
                        cosEndPointSuffix, distinguishHost, networkVersionId);
                return;
            } catch (IOException e) {
                if (retryIndex < maxRetry) {
                    log.warn(String.format("init chdfs impl failed, we will retry again, retryInfo: %d/%d", retryIndex,
                            maxRetry), e);
                } else {
                    log.error("init chdfs impl failed", e);
                    throw new IOException("init chdfs impl failed", e);
                }
            }
            try {
                Thread.sleep(ThreadLocalRandom.current().nextLong(500, 2000));
            } catch (InterruptedException ignore) {
                // ignore
            }
        }
    }

    @java.lang.Override
    public java.net.URI getUri() {
        return this.uri;
    }

    private void judgeActualFSInitialized() {
        if (this.actualImplFS == null) {
            throw new RuntimeException("please init the fileSystem first!");
        }
    }

    private String initPluginNetworkVersion() {
        String networkVersionId = "unknown";

        Properties versionProp = new Properties();
        InputStream in = null;
        final String versionPropName = "chdfsHadoopPluginNetworkVersionInfo.properties";
        try {
            in = this.getClass().getClassLoader().getResourceAsStream(versionPropName);
            if (in != null) {
                versionProp.load(in);
                networkVersionId = versionProp.getProperty("network_version");

            } else {
                log.error("load versionInfo properties failed, propName: {} ", versionPropName);
            }
        } catch (IOException e) {
            log.error("load versionInfo properties failed", e);
        } finally {
            IOUtils.closeQuietly(in);
        }
        return networkVersionId;
    }

    @java.lang.Override
    public FSDataInputStream open(Path f, int bufferSize) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.open(f, bufferSize);
    }

    @java.lang.Override
    public FSDataOutputStream createNonRecursive(Path f, FsPermission permission, EnumSet flags,
                                                 int bufferSize, short replication, long blockSize, Progressable progress) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.createNonRecursive(f, permission, flags, bufferSize, replication, blockSize, progress);
    }

    @java.lang.Override
    public FSDataOutputStream create(Path f, FsPermission permission, boolean overwrite, int bufferSize,
                                     short replication, long blockSize, Progressable progress) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.create(f, permission, overwrite, bufferSize, replication, blockSize, progress);
    }

    @java.lang.Override
    public FSDataOutputStream append(Path f, int bufferSize, Progressable progress) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.append(f, bufferSize, progress);
    }

    public boolean truncate(Path f, long newLength) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.truncate(f, newLength);
    }

    @Override
    public void concat(Path trg, Path[] psrcs) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.concat(trg, psrcs);
    }

    @java.lang.Override
    public boolean rename(Path src, Path dst) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.rename(src, dst);
    }

    @java.lang.Override
    public boolean delete(Path f, boolean recursive) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.delete(f, recursive);
    }

    @java.lang.Override
    public boolean deleteOnExit(Path f) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.deleteOnExit(f);
    }

    @java.lang.Override
    public boolean cancelDeleteOnExit(Path f) {
        judgeActualFSInitialized();
        return this.actualImplFS.cancelDeleteOnExit(f);
    }


    @java.lang.Override
    public FileStatus[] listStatus(Path f) throws FileNotFoundException, IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.listStatus(f);
    }

    @java.lang.Override
    public Path getWorkingDirectory() {
        return this.workingDir;
    }

    @java.lang.Override
    public void setWorkingDirectory(Path new_dir) {
        this.workingDir = new_dir;
        if (this.actualImplFS == null) {
            log.warn("fileSystem is not init yet!");
        } else {
            this.actualImplFS.setWorkingDirectory(new_dir);
        }
    }

    @Override
    public Path getHomeDirectory() {
        if (this.actualImplFS == null) {
            return super.getHomeDirectory();
        }
        return this.actualImplFS.getHomeDirectory();
    }

    @java.lang.Override
    public boolean mkdirs(Path f, FsPermission permission) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.mkdirs(f, permission);
    }

    @java.lang.Override
    public FileStatus getFileStatus(Path f) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getFileStatus(f);
    }

    @Override
    public void createSymlink(Path target, Path link, boolean createParent)
            throws AccessControlException, FileAlreadyExistsException, FileNotFoundException,
            ParentNotDirectoryException, UnsupportedFileSystemException, IOException {
        judgeActualFSInitialized();
        this.actualImplFS.createSymlink(target, link, createParent);
    }

    @Override
    public FileStatus getFileLinkStatus(final Path f)
            throws AccessControlException, FileNotFoundException, UnsupportedFileSystemException, IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getFileLinkStatus(f);
    }

    @Override
    public boolean supportsSymlinks() {
        if (this.actualImplFS == null) {
            return super.supportsSymlinks();
        }
        return this.actualImplFS.supportsSymlinks();
    }


    @Override
    public Path getLinkTarget(Path f) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getLinkTarget(f);
    }

    @Override
    protected Path resolveLink(Path f) throws IOException {
        return getLinkTarget(f);
    }

    @Override
    public FileChecksum getFileChecksum(Path f, long length) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getFileChecksum(f, length);
    }

    @Override
    public void setVerifyChecksum(boolean verifyChecksum) {
        judgeActualFSInitialized();
        this.actualImplFS.setVerifyChecksum(verifyChecksum);
    }

    @Override
    public void setWriteChecksum(boolean writeChecksum) {
        judgeActualFSInitialized();
        this.actualImplFS.setWriteChecksum(writeChecksum);
    }

    @Override
    public FsStatus getStatus(Path p) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getStatus(p);
    }

    @Override
    public void setPermission(Path p, FsPermission permission) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.setPermission(p, permission);
    }

    @Override
    public void setOwner(Path p, String username, String groupname) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.setOwner(p, username, groupname);
    }

    @Override
    public void setTimes(Path p, long mtime, long atime) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.setTimes(p, mtime, atime);
    }

    @Override
    public Path createSnapshot(Path path, String snapshotName) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.createSnapshot(path, snapshotName);
    }

    @Override
    public void renameSnapshot(Path path, String snapshotOldName, String snapshotNewName) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.renameSnapshot(path, snapshotOldName, snapshotNewName);
    }

    @Override
    public void deleteSnapshot(Path path, String snapshotName) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.deleteSnapshot(path, snapshotName);
    }

    @Override
    public void modifyAclEntries(Path path, List aclSpec) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.modifyAclEntries(path, aclSpec);
    }

    @Override
    public void removeAclEntries(Path path, List aclSpec) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.removeAclEntries(path, aclSpec);
    }

    @Override
    public void removeDefaultAcl(Path path) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.removeDefaultAcl(path);
    }

    @Override
    public void removeAcl(Path path) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.removeAcl(path);
    }

    @Override
    public void setAcl(Path path, List aclSpec) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.setAcl(path, aclSpec);
    }

    @Override
    public AclStatus getAclStatus(Path path) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getAclStatus(path);
    }

    @Override
    public void setXAttr(Path path, String name, byte[] value, EnumSet flag) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.setXAttr(path, name, value, flag);
    }

    @Override
    public byte[] getXAttr(Path path, String name) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getXAttr(path, name);
    }

    @Override
    public Map getXAttrs(Path path) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getXAttrs(path);
    }

    @Override
    public Map getXAttrs(Path path, List names) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getXAttrs(path, names);
    }

    @Override
    public List listXAttrs(Path path) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.listXAttrs(path);
    }

    @Override
    public void removeXAttr(Path path, String name) throws IOException {
        judgeActualFSInitialized();
        this.actualImplFS.removeXAttr(path, name);
    }

    @Override
    public Token getDelegationToken(String renewer) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getDelegationToken(renewer);
    }

    @Override
    public String getCanonicalServiceName() {
        if (this.actualImplFS == null) {
            return null;
        } else {
            return this.actualImplFS.getCanonicalServiceName();
        }
    }

    @Override
    public ContentSummary getContentSummary(Path f) throws IOException {
        judgeActualFSInitialized();
        return this.actualImplFS.getContentSummary(f);
    }

    @Override
    public void releaseFileLock(Path p) throws IOException {
        if (this.actualImplFS == null) {
            throw new IOException("please init the fileSystem first!");
        }
        this.actualImplFS.releaseFileLock(p);
    }


    @Override
    public void close() throws IOException {
        judgeActualFSInitialized();
        super.close();
        this.actualImplFS.close();
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy