All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.dasasian.chok.node.ShardManager Maven / Gradle / Ivy

/**
 * Copyright (C) 2014 Dasasian ([email protected])
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *         http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.dasasian.chok.node;

import com.dasasian.chok.util.ChokException;
import com.dasasian.chok.util.FileUtil;
import com.dasasian.chok.util.ThrottledInputStream;
import com.dasasian.chok.util.ThrottledInputStream.ThrottleSemaphore;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.*;
import org.apache.hadoop.fs.permission.FsPermission;
import org.apache.hadoop.util.Progressable;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.io.File;
import java.io.IOException;
import java.net.URI;
import java.net.URISyntaxException;
import java.util.Arrays;
import java.util.Collection;
import java.util.Collections;

public class ShardManager {

    protected final static Logger LOG = LoggerFactory.getLogger(ShardManager.class);
    private final File shardsFolder;
    private final ThrottleSemaphore throttleSemaphore;

    public ShardManager(File shardsFolder) {
        this(shardsFolder, null);
    }

    public ShardManager(File shardsFolder, ThrottleSemaphore throttleSemaphore) {
        this.shardsFolder = shardsFolder;
        this.throttleSemaphore = throttleSemaphore;
        if (!this.shardsFolder.exists()) {
            this.shardsFolder.mkdirs();
        }
        if (!this.shardsFolder.exists()) {
            throw new IllegalStateException("could not create local shard folder '" + this.shardsFolder.getAbsolutePath() + "'");
        }
    }

    public File installShard(String shardName, String shardPath) throws Exception {
        File localShardFolder = getShardFolder(shardName);
        try {
            if (!localShardFolder.exists()) {
                installShard(shardName, shardPath, localShardFolder);
            }
            return localShardFolder;
        } catch (Exception e) {
            FileUtil.deleteFolder(localShardFolder);
            throw e;
        }
    }

    public void uninstallShard(String shardName) {
        File localShardFolder = getShardFolder(shardName);
        FileUtil.deleteFolder(localShardFolder);
    }

    public Collection getInstalledShards() {
        String[] folderList = shardsFolder.list(FileUtil.VISIBLE_FILES_FILTER);
        if (folderList == null) {
            return Collections.EMPTY_LIST;
        }
        return Arrays.asList(folderList);
    }

    public File getShardsFolder() {
        return shardsFolder;
    }

    public File getShardFolder(String shardName) {
        return new File(shardsFolder, shardName);
    }

    /*
     * Loads a shard from the given URI. The uri is handled bye the hadoop file
     * system. So all hadoop support file systems can be used, like local hdfs s3
     * etc. In case the shard is compressed we also unzip the content. If the
     * system property chok.spool.zip.shards is true, the zip file is staged to
     * the local disk before being unzipped.
     */
    private void installShard(String shardName, String shardPath, File localShardFolder) throws ChokException {
        LOG.info("install shard '" + shardName + "' from " + shardPath);
        // TODO sg: to fix HADOOP-4422 we try to download the shard 5 times
        int maxTries = 5;
        for (int i = 0; i < maxTries; i++) {
            URI uri;
            try {
                uri = new URI(shardPath);
                FileSystem fileSystem = FileSystem.get(uri, new Configuration());
                if (throttleSemaphore != null) {
                    fileSystem = new ThrottledFileSystem(fileSystem, throttleSemaphore);
                }
                final Path path = new Path(shardPath);
                boolean isZip = fileSystem.isFile(path) && shardPath.endsWith(".zip");

                File shardTmpFolder = new File(localShardFolder.getAbsolutePath() + "_tmp");
                try {
                    FileUtil.deleteFolder(localShardFolder);
                    FileUtil.deleteFolder(shardTmpFolder);

                    if (isZip) {
                        FileUtil.unzip(path, shardTmpFolder, fileSystem, "true".equalsIgnoreCase(System.getProperty("chok.spool.zip.shards", "false")));
                    } else {
                        fileSystem.copyToLocalFile(path, new Path(shardTmpFolder.getAbsolutePath()));
                    }
                    shardTmpFolder.renameTo(localShardFolder);
                } finally {
                    // Ensure that the tmp folder is deleted on an error
                    FileUtil.deleteFolder(shardTmpFolder);
                }
                // Looks like we were successful.
                if (i > 0) {
                    LOG.error("Loaded shard:" + shardPath);
                }
                return;
            } catch (final URISyntaxException e) {
                throw new ChokException("Can not parse uri for path: " + shardPath, e);
            } catch (final Exception e) {
                LOG.error(String.format("Error loading shard: %s (try %d of %d)", shardPath, i, maxTries), e);
                if (i >= maxTries - 1) {
                    throw new ChokException("Can not load shard: " + shardPath, e);
                }
            }
        }
    }

    @SuppressWarnings("deprecation")
    private static class ThrottledFileSystem extends FileSystem {

        private final FileSystem fileSystemDelegate;
        private final ThrottleSemaphore throttleSemaphore;

        public ThrottledFileSystem(FileSystem fileSystem, ThrottleSemaphore throttleSemaphore) {
            fileSystemDelegate = fileSystem;
            this.throttleSemaphore = throttleSemaphore;
        }

        @Override
        public FSDataOutputStream append(Path arg0, int arg1, Progressable arg2) throws IOException {
            return fileSystemDelegate.append(arg0, arg1, arg2);
        }

        @Override
        public FSDataOutputStream create(Path arg0, FsPermission arg1, boolean arg2, int arg3, short arg4, long arg5, Progressable arg6) throws IOException {
            return fileSystemDelegate.create(arg0, arg1, arg2, arg3, arg4, arg5, arg6);
        }

        @Override
        public boolean delete(Path arg0) throws IOException {
            return fileSystemDelegate.delete(arg0);
        }

        @Override
        public boolean delete(Path arg0, boolean arg1) throws IOException {
            return fileSystemDelegate.delete(arg0, arg1);
        }

        @Override
        public FileStatus getFileStatus(Path arg0) throws IOException {
            return fileSystemDelegate.getFileStatus(arg0);
        }

        @Override
        public URI getUri() {
            return fileSystemDelegate.getUri();
        }

        @Override
        public Path getWorkingDirectory() {
            return fileSystemDelegate.getWorkingDirectory();
        }

        @Override
        public void setWorkingDirectory(Path arg0) {
            fileSystemDelegate.setWorkingDirectory(arg0);
        }

        @Override
        public FileStatus[] listStatus(Path arg0) throws IOException {
            return fileSystemDelegate.listStatus(arg0);
        }

        @Override
        public boolean mkdirs(Path arg0, FsPermission arg1) throws IOException {
            return fileSystemDelegate.mkdirs(arg0, arg1);
        }

        @Override
        public FSDataInputStream open(Path path, int bufferSize) throws IOException {
            ThrottledInputStream throttledInputStream = new ThrottledInputStream(fileSystemDelegate.open(path, bufferSize), throttleSemaphore);
            return new FSDataInputStream(throttledInputStream);
        }

        @Override
        public boolean rename(Path arg0, Path arg1) throws IOException {
            return fileSystemDelegate.rename(arg0, arg1);
        }

        @Override
        public Configuration getConf() {
            return fileSystemDelegate.getConf();
        }
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy