All downloads are free. The search and download features use the official Maven repository.

com.thinkaurelius.titan.hadoop.compat.h1.DistCacheConfigurer Maven / Gradle / Ivy

package com.thinkaurelius.titan.hadoop.compat.h1;

import com.thinkaurelius.titan.hadoop.config.job.AbstractDistCacheConfigurer;
import com.thinkaurelius.titan.hadoop.config.job.JobClasspathConfigurer;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.filecache.DistributedCache;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.mapreduce.Job;

import java.io.IOException;

public class DistCacheConfigurer extends AbstractDistCacheConfigurer implements JobClasspathConfigurer {

    public DistCacheConfigurer(String mapredJarFilename) {
        super(mapredJarFilename);
    }

    @Override
    public void configure(Job job) throws IOException {

        for (Path p : getLocalPaths()) {
            Configuration conf = job.getConfiguration();
            FileSystem jobFS = FileSystem.get(conf);
            FileSystem localFS = FileSystem.getLocal(conf);
            Path stagedPath = uploadFileIfNecessary(localFS, p, jobFS);
            DistributedCache.addFileToClassPath(stagedPath, conf, jobFS);
        }

        // We don't really need to set a mapred job jar here,
        // but doing so suppresses a warning
        String mj = getMapredJar();
        if (null != mj)
            job.getConfiguration().set(Hadoop1Compat.CFG_JOB_JAR, mj);
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy