All downloads are FREE. Search and download functionality uses the official Maven repository.

io.github.repir.MapReduceTools.NullInputFormat Maven / Gradle / Ivy

The newest version!
package io.github.repir.MapReduceTools;

import io.github.repir.Repository.Repository;
import io.github.repir.tools.lib.Log;
import org.apache.hadoop.io.NullWritable;

/**
 * A custom implementation of Hadoop's InputFormat that holds the InputSplits
 * to be retrieved, and whose {@link #createIS(Repository, int)} factory
 * produces {@link NullInputSplit} instances.
 * <p>
 * The class is meant to be used statically: initialize it with
 * {@code setRepository(Repository)} and register Query requests for the
 * MapReduce job with {@code add(Repository, Query)}. Internally, a separate
 * InputSplit is created for each repository partition, and every Query
 * request that is added is added to each split.
 * <p>
 * When {@code cansplit == true}, the InputSplits are divided over
 * 2 * the number of nodes in the cluster (as defined in
 * {@code cluster.nodes}) to spread the workload more evenly.
 * <p>
 * NOTE(review): {@code setRepository}, {@code add} and {@code cansplit} are
 * not declared in this class; presumably they are inherited from
 * {@link MRInputFormat} -- confirm.
 *
 * @author jeroen
 */
public class NullInputFormat extends MRInputFormat {

   /** Logger for this class. */
   public static Log log = new Log(NullInputFormat.class);

   /**
    * Creates an instance through the superclass's no-argument constructor.
    */
   public NullInputFormat() {
      super();
   }

   /**
    * Creates an instance for the given repository by delegating to the
    * superclass constructor.
    *
    * @param repository the repository handed to {@link MRInputFormat}
    */
   public NullInputFormat(Repository repository) {
      super(repository);
   }

   /**
    * Creates the input split for a single partition of a repository.
    *
    * @param repository the repository the split is created for
    * @param partition the partition number passed on to the split
    * @return a new {@link NullInputSplit} built from {@code repository} and
    *         {@code partition}
    */
   @Override
   public MRInputSplit createIS(Repository repository, int partition) {
      MRInputSplit split = new NullInputSplit(repository, partition);
      return split;
   }
}





© 2015 - 2025 Weber Informatics LLC | Privacy Policy