All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.sysml.runtime.util.InputStreamInputFormat Maven / Gradle / Ivy

There is a newer version: 1.2.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 * 
 *   http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.apache.sysml.runtime.util;

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;

import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapred.FileSplit;
import org.apache.hadoop.mapred.InputFormat;
import org.apache.hadoop.mapred.InputSplit;
import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapred.RecordReader;
import org.apache.hadoop.mapred.Reporter;

/**
 * Custom input format and record reader to redirect common implementation of csv read 
 * over record readers (which are required for the parallel readers) to an input stream.
 * 
 */
public class InputStreamInputFormat implements InputFormat
{
	private final InputStream _input;
		
	public InputStreamInputFormat(InputStream is) {
		_input = is;
	}

	@Override
	public InputSplit[] getSplits(JobConf job, int numSplits) throws IOException {
		//return dummy handle - stream accessed purely over record reader
		return new InputSplit[]{new FileSplit(null)};
	}

	@Override
	public RecordReader getRecordReader(InputSplit split, JobConf job, Reporter reporter) throws IOException {
		return new InputStreamRecordReader(_input);
	}
		
	private static class InputStreamRecordReader implements RecordReader
	{
		private final BufferedReader _reader;
		
		public InputStreamRecordReader(InputStream is) {
			_reader = new BufferedReader(new InputStreamReader( is ));
		}
		
		@Override
		public LongWritable createKey() {
			return new LongWritable();
		}
		@Override
		public Text createValue() {
			return new Text();
		}			
		@Override
		public float getProgress() throws IOException {
			return 0;
		}
		@Override
		public long getPos() throws IOException {
			return 0;
		}
		@Override
		public boolean next(LongWritable key, Text value) throws IOException {
			String line = _reader.readLine();
			if( line != null )
				value.set(line);
			return (line != null);
		}
		@Override
		public void close() throws IOException {
			_reader.close();
		}
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy