All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.blazemeter.csv.RandomCSVReader Maven / Gradle / Ivy

There is a newer version: 0.8
Show newest version
package com.blazemeter.csv;

import org.apache.jmeter.save.CSVSaveService;
import org.apache.jmeter.services.FileServer;
import org.apache.jorphan.logging.LoggingManager;
import org.apache.log.Logger;

import java.io.BufferedReader;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.RandomAccessFile;
import java.io.Reader;
import java.nio.channels.ClosedChannelException;
import java.util.ArrayList;
import java.util.Random;

public class RandomCSVReader {
    private static final Logger LOGGER = LoggingManager.getLoggerForClass();

    private File file;
    private String encoding;
    private char delim;
    private boolean randomOrder;
    private boolean isRewindOnEndOfList;

    private ArrayList offsets;
    private int curPos = 0;
    private final ThreadLocal rbr = new ThreadLocal() {
        @Override
        protected RandomBufferedReader initialValue() {
            try {
                return new RandomBufferedReader(createReader(), new RandomAccessFile(file, "r"), encoding);
            } catch (IOException e) {
                LOGGER.error("Cannot create RandomBufferedReader", e);
                throw new RuntimeException("Cannot create RandomBufferedReader", e);
            }
        }
    };
    private Random random;

    private BufferedReader consistentReader;
    private String[] header;

    private boolean isSkipFirstLine;


    public RandomCSVReader(String filename, String encoding,
                           String delim, boolean randomOrder,
                           boolean hasVariableNames, boolean firstLineIsHeader,
                           boolean isRewindOnEndOfList) {
        File f = new File(filename);
        this.file = (f.isAbsolute() || f.exists()) ? f : new File(FileServer.getFileServer().getBaseDir(), filename);
        this.encoding = encoding;
        this.delim = checkDelimiter(delim).charAt(0);
        this.isSkipFirstLine = !(!firstLineIsHeader && hasVariableNames);
        this.randomOrder = randomOrder;
        this.isRewindOnEndOfList = isRewindOnEndOfList;
        try {
            initOffsets();
            if (randomOrder) {
                initRandom();
            } else {
                initConsistentReader();
            }
            initHeader();
        } catch (IOException ex) {
            LOGGER.error("Cannot initialize RandomCSVReader, because of error: ", ex);
            throw new RuntimeException("Cannot initialize RandomCSVReader, because of error: " + ex.getMessage(), ex);
        }
    }

    private String checkDelimiter(String delim) {
        if ("\\t".equals(delim)) {
            return "\t";
        } else if (delim.isEmpty()) {
            LOGGER.debug("Empty delimiter, will use ','");
            return ",";
        }
        return delim;
    }

    private void initHeader() {
        try (BufferedReader reader = new BufferedReader(createReader())) {
            header = CSVSaveService.csvReadFile(reader, delim);
        } catch (IOException ex) {
            LOGGER.error("Cannot read CSV header ", ex);
            throw new RuntimeException("Cannot read CSV header: " + ex.getMessage(), ex);
        }
    }

    private void initConsistentReader() throws IOException {
        consistentReader = new BufferedReader(createReader());
        if (isSkipFirstLine && !this.offsets.isEmpty()) {
            consistentReader.skip(this.offsets.get(0)); //TODO: any other ideas how skip header?
        }
    }

    public void closeConsistentReader() throws IOException {
        consistentReader.close();
    }

    public boolean hasNextRecord() {
        if (!(curPos < offsets.size()) && isRewindOnEndOfList) {
            reInitialize();
            LOGGER.debug("Reset cursor position");
            curPos = 0;
            return true;
        } else if (curPos < offsets.size()) {
            return true;
        }
        return false;
    }

    private void reInitialize() {
        if (randomOrder) {
            initRandom();
        } else {
            try {
                closeConsistentReader();
                initConsistentReader();
            } catch (IOException ex) {
                LOGGER.error("Cannot reInitialize consistent reader ", ex);
                throw new RuntimeException("Cannot reInitialize consistent reader: " + ex.getMessage(), ex);
            }
        }
    }

    public String[] getHeader() {
        return header;
    }

    public String[] readNextLine() {
        try {
            curPos++;
            return CSVSaveService.csvReadFile(consistentReader, delim);
        } catch (IOException ex) {
            LOGGER.error("Cannot get next record from csv file: ", ex);
            throw new RuntimeException("Cannot get next record from csv file: " + ex.getMessage(), ex);
        }
    }

    public long getNextLineAddr() {
        int pos = getRandomPos();
        swap(curPos + pos);
        long lineAddr = offsets.get(curPos);
        curPos++;
        return lineAddr;
    }

    private void swap(int pos) {
        Integer tmp = offsets.get(curPos);
        offsets.set(curPos, offsets.get(pos));
        offsets.set(pos, tmp);
    }

    public String[] readLineWithSeek(long pos) {
        try {
            rbr.get().seek(pos);
            return CSVSaveService.csvReadFile(rbr.get(), delim);
        } catch (ClosedChannelException ex) {
            LOGGER.warn("The channel has been closed");
            return new String[0];
        } catch (IOException ex) {
            LOGGER.error("Cannot get next record from csv file: ", ex);
            throw new RuntimeException("Cannot get next record from csv file: " + ex.getMessage(), ex);
        }
    }

    private int getRandomPos() {
        return random.nextInt(offsets.size() - curPos);
    }

    private void initRandom() {
        this.random = new Random(System.currentTimeMillis());
    }

    private void initOffsets() throws IOException {
        offsets = new ArrayList<>();
        if (!isSkipFirstLine) {
            offsets.add(0);
        }
        LOGGER.info("Start reading the file: " + file.getAbsolutePath());
        try (BufferedReaderExt reader = new BufferedReaderExt(createReader(), encoding)) {
            long fileSize = file.length();
            while (reader.getPos() < fileSize) {
                CSVSaveService.csvReadFile(reader, delim);
                if (reader.getPos() < fileSize) {
                    offsets.add(reader.getPos());
                }
            }
        }
        LOGGER.info("Reading finished. Found " + offsets.size() + " records in your csv file");
    }

    private Reader createReader() throws IOException {
        return new InputStreamReader(new FileInputStream(file), encoding);
    }

    public void close() {
        try {
            if (randomOrder) {
                rbr.get().close();
            }
        } catch (IOException ex) {
            LOGGER.warn("Failed to close readers");
        }
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy