org.geneweaver.io.reader.AbstractStreamReader Maven / Gradle / Ivy
/*-
*
* Copyright 2018, 2020 The Jackson Laboratory Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* @author Matthew Gerring
*/
package org.geneweaver.io.reader;
import java.util.HashMap;
import java.util.Iterator;
import java.util.LinkedList;
import java.util.List;
import java.util.Map;
import java.util.function.Function;
import java.util.stream.Stream;
import org.geneweaver.domain.Entity;
/**
* Base class for all reader implementations.
* @author gerrim
*
* @param
*/
public abstract class AbstractStreamReader implements StreamReader {
protected ReaderRequest request;
protected String entryName; // When reading from an archive, the entry name is set by the archive reader.
/**
* Amount to wind forward when using multi-threading.
* This is the maximum amount which one thread will tackle
* in a single job.
*/
protected int chunkSize = Integer.getInteger("org.geneweaver.io.windForward", 4096);
/**
* All readers must have a create method which is called
* by the reader factory after the no-argument constructor.
* @param request
*/
@SuppressWarnings("unchecked")
public > R init(ReaderRequest request) throws ReaderException {
this.request = request;
return (R)this;
}
/**
* Gets the chunk size.
*
* @return the windForwardAmount
*/
public int getChunkSize() {
return chunkSize;
}
/**
* Set the amount each thread will attempt to wind forward for
* its chunk. Adjusting this affects execution time for larhge runs.
*
* @param windForwardAmount the new chunk size
*/
public void setChunkSize(int windForwardAmount) {
this.chunkSize = windForwardAmount;
}
private Iterator iterator;
/**
* Used to wind forward somewhere between 0 and the chunk size.
* @return the items passed when winding forward.
*/
public List wind() throws ReaderException {
if (iterator==null || !iterator.hasNext()) iterator = stream().iterator();
List ls = new LinkedList<>(); // linked list is fast to add/iterate
for (int i = 0; i < getChunkSize() && iterator.hasNext(); i++) {
ls.add(iterator.next());
}
return ls;
}
/**
* @return the entryName
*/
public String getEntryName() {
return entryName;
}
protected String getCurrentFileName() {
String name = getEntryName();
return name!=null
? name.substring(name.indexOf('/')+1)
: request.name();
}
/**
* @param entryName the entryName to set
*/
public void setEntryName(String entryName) {
this.entryName = entryName;
}
@Override
public Function> getDefaultConnector() {
throw new RuntimeException("No connector for "+getClass().getSimpleName());
}
/**
* Used to create an index map from a segmented line.
* @param segs
* @return map of segment name to index.
*/
protected Map parseIndices(String[] segs) {
Map indices = new HashMap<>();
for (int i = 0; i < segs.length; i++) {
indices.put(segs[i].toLowerCase(), i);
}
return indices;
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy