
com.qiniu.datasource.FileContainer Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of qsuits Show documentation
Show all versions of qsuits Show documentation
qiniu-suits is an efficient tool for the Qiniu API, implemented in Java 8.
package com.qiniu.datasource;
import com.qiniu.common.QiniuException;
import com.qiniu.entry.CommonParams;
import com.qiniu.interfaces.ILineProcess;
import com.qiniu.interfaces.ITypeConvert;
import com.qiniu.persistence.IResultOutput;
import com.qiniu.util.HttpRespUtils;
import com.qiniu.util.SystemUtils;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicBoolean;
public abstract class FileContainer implements IDataSource, IResultOutput, T> {
private String filePath;
protected String parse;
protected String separator;
protected String addKeyPrefix;
protected String rmKeyPrefix;
protected Map indexMap;
protected int unitLen;
private int threads;
protected int retryTimes = 5;
protected String savePath;
protected boolean saveTotal;
protected String saveFormat;
protected String saveSeparator;
protected Set rmFields;
private ExecutorService executorPool; // 线程池
private AtomicBoolean exitBool; // 多线程的原子操作 bool 值
private ILineProcess processor; // 定义的资源处理器
/**
 * Creates a file-based data source container.
 *
 * @param filePath     path later handed to {@code getFileReaders} by {@code export()}
 * @param parse        stored as-is in the protected {@code parse} field
 * @param separator    stored as-is in the protected {@code separator} field
 * @param addKeyPrefix stored as-is in the protected {@code addKeyPrefix} field
 * @param rmKeyPrefix  stored as-is in the protected {@code rmKeyPrefix} field
 * @param indexMap     stored as-is in the protected {@code indexMap} field
 * @param unitLen      number of buffered source lines that triggers a conversion/processing batch
 * @param threads      upper bound on the number of worker threads used by {@code export()}
 */
public FileContainer(String filePath, String parse, String separator, String addKeyPrefix, String rmKeyPrefix,
                     Map indexMap, int unitLen, int threads) {
    // Full records are not persisted unless setSaveOptions/updateSettings says otherwise.
    this.saveTotal = false;

    // Input location and concurrency.
    this.filePath = filePath;
    this.threads = threads;
    this.unitLen = unitLen;

    // Line parsing settings.
    this.parse = parse;
    this.separator = separator;
    this.indexMap = indexMap;
    this.addKeyPrefix = addKeyPrefix;
    this.rmKeyPrefix = rmKeyPrefix;
}
/**
 * Configures how results are persisted. If this method is never called, every
 * save-related field keeps its default value.
 *
 * @param savePath  stored in {@code savePath}
 * @param saveTotal whether the line-level {@code export} also writes the converted records through the saver
 * @param format    stored in {@code saveFormat}
 * @param separator stored in {@code saveSeparator}
 * @param rmFields  stored in {@code rmFields}
 */
public void setSaveOptions(String savePath, boolean saveTotal, String format, String separator, Set rmFields) {
    this.saveTotal = saveTotal;
    this.savePath = savePath;
    this.saveFormat = format;
    // Note: the parameter is the *save* separator, not the parsing separator field.
    this.saveSeparator = separator;
    this.rmFields = rmFields;
}
/**
 * Sets the retry count used when reading lines; the line-level {@code export}
 * derives its number of read attempts from this value ({@code retryTimes + 1}).
 * No validation is performed on the value.
 *
 * @param retryTimes number of retries after a failed read
 */
public void setRetryTimes(int retryTimes) {
this.retryTimes = retryTimes;
}
/**
 * Refreshes all basic settings of this container from the given parameters object,
 * overwriting whatever was set by the constructor or the individual setters.
 *
 * @param commonParams source of the new values
 */
public void updateSettings(CommonParams commonParams) {
    // Input location and line parsing.
    filePath = commonParams.getPath();
    parse = commonParams.getParse();
    separator = commonParams.getSeparator();
    addKeyPrefix = commonParams.getAddKeyPrefix();
    rmKeyPrefix = commonParams.getRmKeyPrefix();
    indexMap = commonParams.getIndexMap();

    // Batching, concurrency and retry behaviour.
    unitLen = commonParams.getUnitLen();
    threads = commonParams.getThreads();
    retryTimes = commonParams.getRetryTimes();

    // Result persistence.
    savePath = commonParams.getSavePath();
    saveTotal = commonParams.getSaveTotal();
    saveFormat = commonParams.getSaveFormat();
    saveSeparator = commonParams.getSaveSeparator();
    rmFields = commonParams.getRmFields();
}
/**
 * Sets the line processor for this container. {@code execInThread} clones it for
 * each reader task, and {@code export()} includes its process name in the progress
 * message. May be left {@code null}, in which case no processing step is run.
 *
 * @param processor the processor to clone for each task, or {@code null}
 */
public void setProcessor(ILineProcess processor) {
this.processor = processor;
}
/**
 * Creates the converter that the line-level {@code export} uses to turn each batch
 * of raw source lines into the objects handed to the line processor.
 *
 * @throws IOException if the converter cannot be created
 */
protected abstract ITypeConvert getNewConverter() throws IOException;
/**
 * Creates the converter that the line-level {@code export} uses to turn converted
 * objects back into strings; those strings are written through the saver when
 * {@code saveTotal} is enabled.
 *
 * @throws IOException if the converter cannot be created
 */
protected abstract ITypeConvert getNewStringConverter() throws IOException;
/**
 * Reads every line from {@code reader}, converts the lines in batches and hands each
 * converted batch to {@code processor}.
 *
 * <p>Non-empty lines are buffered until {@code unitLen} lines are collected or the
 * reader is exhausted. Each batch is converted with a fresh converter from
 * {@link #getNewConverter()}; conversion errors are written through
 * {@code saver.writeError}. When {@code saveTotal} is set, the converted batch is
 * additionally turned back into strings and written through {@code saver.writeSuccess}.
 *
 * @param reader    source of lines; {@code readLine()} returning {@code null} ends the export
 * @param saver     destination for converted records and error lines
 * @param processor processor applied to each converted batch, or {@code null} to skip processing
 * @throws IOException if a line still cannot be read after all retries, if saving fails, or if
 *                     the processor raises an exception that {@code HttpRespUtils.checkException}
 *                     classifies as fatal ({@code -2})
 */
public void export(IReader reader, IResultOutput saver, ILineProcess processor) throws IOException {
    ITypeConvert converter = getNewConverter();
    ITypeConvert stringConverter = getNewStringConverter();
    List srcList = new ArrayList<>();
    List convertedList;
    List writeList;
    String line;
    do {
        line = readLineWithRetry(reader);
        if (line != null && !line.isEmpty()) srcList.add(line);

        boolean endOfInput = line == null;
        boolean batchFull = srcList.size() >= unitLen;
        // Never flush an empty batch: with unitLen <= 0 a blank input line would otherwise
        // trigger a pointless conversion/processing round.
        if (srcList.isEmpty() || !(batchFull || endOfInput)) continue;

        convertedList = converter.convertToVList(srcList);
        if (converter.errorSize() > 0) saver.writeError(converter.errorLines(), false);
        if (saveTotal) {
            writeList = stringConverter.convertToVList(convertedList);
            if (writeList.size() > 0) saver.writeSuccess(String.join("\n", writeList), false);
            if (stringConverter.errorSize() > 0)
                saver.writeKeyFile("string-error", stringConverter.errorLines(), false);
        }
        // A processing failure only aborts the export when it is classified as fatal;
        // any other failure is skipped so that reading continues. Per the original
        // author's note, the processor itself records the failed entries and only a
        // 599 status leads to the exception being rethrown.
        try {
            if (processor != null) processor.processLine(convertedList);
        } catch (QiniuException e) {
            if (HttpRespUtils.checkException(e, 1) == -2) throw e;
        }
        srcList.clear();
    } while (line != null);
}

/**
 * Reads one line, retrying up to {@code retryTimes} times after an {@link IOException}.
 * A negative {@code retryTimes} is treated as zero, so at least one read attempt is
 * always made. readLine() is used rather than a lines() stream because, per the original
 * author's note, streaming a very large file could exhaust memory.
 */
private String readLineWithRetry(IReader reader) throws IOException {
    int retriesLeft = Math.max(retryTimes, 0);
    while (true) {
        try {
            return reader.readLine();
        } catch (IOException e) {
            if (retriesLeft-- <= 0) throw e;
        }
    }
}
/**
 * Creates the result saver for one reader task.
 *
 * @param order identifier of the task; {@code execInThread} passes the task's
 *              sequence number converted with {@code String.valueOf}
 * @throws IOException if the saver cannot be created
 */
protected abstract IResultOutput getNewResultSaver(String order) throws IOException;
/**
 * Submits one export task for {@code reader} to the executor pool.
 *
 * <p>The task runs the line-level {@code export}, then closes the saver, the processor
 * clone and the reader. If anything fails, the task prints the reader's next line as a
 * position hint, releases the same resources (including the reader) and reports the
 * failure through {@code SystemUtils.exit}.
 *
 * @param reader reader to export; closed by the task on both success and failure
 * @param order  sequence number of the task, used to label output and to create the saver
 * @throws Exception if the processor cannot be cloned or the result saver cannot be created
 */
public void execInThread(IReader reader, int order) throws Exception {
    // Every task works on its own clone of the processor. The shared processor is never
    // used directly because closing it would prevent the clones from persisting results.
    ILineProcess lineProcessor = processor == null ? null : processor.clone();
    // Label used to identify this task's persisted results.
    String newOrder = String.valueOf(order);
    IResultOutput saver = getNewResultSaver(newOrder);
    executorPool.execute(() -> {
        try {
            String record = "order " + newOrder + ": " + reader.getName();
            export(reader, saver, lineProcessor);
            record += "\tsuccessfully done";
            System.out.println(record);
            saver.closeWriters();
            if (lineProcessor != null) lineProcessor.closeResource();
            reader.close();
        } catch (Exception e) {
            try {
                try {
                    System.out.println("order " + newOrder + ": " + reader.getName() + "\tnextLine:" + reader.readLine());
                } catch (IOException io) {
                    io.printStackTrace();
                }
                saver.closeWriters();
                if (lineProcessor != null) lineProcessor.closeResource();
                // The reader was previously left open on the failure path.
                try {
                    reader.close();
                } catch (Exception closeError) {
                    closeError.printStackTrace();
                }
            } finally {
                // Always report the original failure, even if the cleanup above throws.
                SystemUtils.exit(exitBool, e);
            }
        }
    });
}
/**
 * Returns the readers for the input located at {@code path}; {@code export()} submits
 * one task per returned reader.
 *
 * NOTE(review): the return type reads {@code List>} here, so a generic type argument
 * appears to have been lost; restore it (presumably a list of IReader) before compiling.
 *
 * @param path input location, {@code export()} passes the configured file path
 * @throws IOException if the readers cannot be created
 */
protected abstract List> getFileReaders(String path) throws IOException;
/**
 * Exports every input file: obtains the readers for the configured path, runs one
 * export task per reader on a fixed thread pool and waits until all tasks finish.
 *
 * <p>The pool uses at most {@code threads} workers, never more than the number of
 * readers, and always at least one so that an empty input or a non-positive
 * {@code threads} setting does not make pool creation fail. Any failure raised while
 * submitting or waiting is passed to {@code SystemUtils.exit}.
 *
 * @throws Exception if the readers cannot be obtained
 */
public void export() throws Exception {
    List<? extends IReader> fileReaders = getFileReaders(filePath);
    int filesCount = fileReaders.size();
    // Executors.newFixedThreadPool rejects a thread count <= 0, so clamp to at least 1.
    int runningThreads = Math.max(1, Math.min(filesCount, threads));
    String info = "read objects from file(s): " + filePath + (processor == null ? "" : " and " + processor.getProcessName());
    System.out.println(info + " running...");
    executorPool = Executors.newFixedThreadPool(runningThreads);
    exitBool = new AtomicBoolean(false);
    try {
        int order = 1;
        for (IReader fileReader : fileReaders) {
            execInThread(fileReader, order++);
        }
        executorPool.shutdown();
        // Block until the pool drains; awaitTermination returns as soon as the last task
        // ends instead of waiting out a fixed sleep interval.
        while (!executorPool.awaitTermination(1, TimeUnit.SECONDS)) {
            // keep waiting
        }
        System.out.println(info + " finished");
    } catch (Throwable throwable) {
        // Preserve the interrupt status for callers before reporting the failure.
        if (throwable instanceof InterruptedException) Thread.currentThread().interrupt();
        SystemUtils.exit(exitBool, throwable);
    }
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy