
com.twitter.maple.tap.MemorySourceTap Maven / Gradle / Ivy
package com.twitter.maple.tap;
import cascading.flow.FlowProcess;
import cascading.scheme.Scheme;
import cascading.scheme.SinkCall;
import cascading.scheme.SourceCall;
import cascading.tap.SourceTap;
import cascading.tap.Tap;
import cascading.tap.hadoop.io.HadoopTupleEntrySchemeIterator;
import cascading.tuple.Fields;
import cascading.tuple.Tuple;
import cascading.tuple.TupleEntryIterator;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.mapred.FileInputFormat;
import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapred.RecordReader;
import java.io.IOException;
import java.io.Serializable;
import java.util.List;
import java.util.UUID;
public class MemorySourceTap extends SourceTap>
implements Serializable {
public static class MemorySourceScheme
extends Scheme, Void, Object[], Void> {
private transient List tuples;
private final String id;
public MemorySourceScheme(List tuples, Fields fields, String id) {
super(fields);
assert tuples != null;
this.tuples = tuples;
this.id = id;
}
public String getId() {
return this.id;
}
public List getTuples() {
return this.tuples;
}
@Override
public void sourceConfInit(FlowProcess extends JobConf> flowProcess,
Tap, Void> tap, JobConf conf) {
FileInputFormat.setInputPaths(conf, this.id);
conf.setInputFormat(TupleMemoryInputFormat.class);
TupleMemoryInputFormat.storeTuples(conf, TupleMemoryInputFormat.TUPLES_PROPERTY, this.tuples);
}
@Override
public void sinkConfInit(FlowProcess extends JobConf> flowProcess,
Tap, Void> tap, JobConf conf) {
throw new UnsupportedOperationException("Not supported yet.");
}
@Override
public void sourcePrepare( FlowProcess extends JobConf> flowProcess, SourceCall
© 2015 - 2025 Weber Informatics LLC | Privacy Policy