All downloads are free. The search and download features use the official Maven repository.

org.datavec.dataframe.io.csv.CsvCombiner Maven / Gradle / Ivy

Go to download

High-performance Java Dataframe with integrated columnar storage (fork of tablesaw)

There is a newer version: 0.9.1
Show newest version
package org.datavec.dataframe.io.csv;


import com.opencsv.CSVReader;
import com.opencsv.CSVWriter;

import javax.annotation.concurrent.Immutable;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.io.UncheckedIOException;
import java.nio.file.Files;
import java.nio.file.Path;
import java.nio.file.Paths;
import java.util.Iterator;
import java.util.stream.Stream;

/**
 * Utility that takes all CSV files in a folder and combines them into a single file.  The files should all have the
 * same structure (number and type of columns) and be consistent in having or not having header lines at the beginning.
 *
 * <p>The class only exposes static methods and cannot be instantiated.
 */
@Immutable
public class CsvCombiner {

    private CsvCombiner() {}

    /**
     * Walks {@code foldername} with {@link Files#walk} and appends the rows of every regular file whose name ends
     * with {@code ".csv"} to {@code newFileName}.
     *
     * <p>The input files are parsed with {@code columnSeparator}; the combined file is always written with a comma
     * separator. When {@code headers} is {@code true}, the first line of every file except the first one visited is
     * dropped, so the combined file carries a single header row.
     *
     * <p>The output file itself is never used as an input, even when it is located inside {@code foldername}.
     *
     * @param foldername      root folder to scan for {@code .csv} files
     * @param newFileName     path of the combined file to create (an existing file is overwritten)
     * @param columnSeparator separator character used by the input files
     * @param headers         {@code true} if every input file starts with a header line
     * @throws IOException if the folder cannot be walked, an input file cannot be read or the output file cannot be
     *                     created
     */
    public static void combineAll(String foldername, String newFileName, char columnSeparator, boolean headers)
                    throws IOException {

        final Path outputPath = Paths.get(newFileName);

        // Every resource, including the directory stream returned by Files.walk, is closed on exit.
        try (FileWriter fileWriter = new FileWriter(newFileName);
             CSVWriter writer = new CSVWriter(fileWriter, ',');
             Stream<Path> paths = Files.walk(Paths.get(foldername))) {

            boolean skipHeader = false;
            // A plain iterator (instead of forEach) lets checked IOExceptions propagate to the caller.
            final Iterator<Path> iterator = paths.iterator();
            while (iterator.hasNext()) {
                final Path filePath = iterator.next();
                if (!Files.isRegularFile(filePath) || !filePath.toString().endsWith(".csv")) {
                    continue;
                }
                // The output file already exists at this point; reading it would append it to itself and,
                // if it were visited first, cause the real header row to be skipped.
                if (Files.isSameFile(filePath, outputPath)) {
                    continue;
                }
                copyRows(filePath.toString(), writer, columnSeparator, headers && skipHeader);
                skipHeader = true;
            }
            writer.flush();
        } catch (UncheckedIOException e) {
            // Files.walk reports I/O failures during traversal as UncheckedIOException; unwrap for callers.
            throw e.getCause();
        }
    }

    /**
     * Appends the rows of {@code fileName} to {@code writer}.
     *
     * <p>This method does not throw on I/O failure: the stack trace is printed and the method returns, leaving
     * whatever rows were already copied in {@code writer}. The reader opened on {@code fileName} is always closed;
     * {@code writer} is left open.
     *
     * @param fileName        path of the CSV file to read
     * @param writer          destination the rows are written to
     * @param columnSeparator separator character used by the input file
     * @param skipHeader      {@code true} to drop the first line of the input file
     */
    public static void append(String fileName, final CSVWriter writer, char columnSeparator, boolean skipHeader) {
        try {
            copyRows(fileName, writer, columnSeparator, skipHeader);
        } catch (IOException e) {
            // Kept for backward compatibility: existing callers rely on this method not throwing.
            e.printStackTrace();
        }
    }

    /** Copies every row (optionally minus the first line) of {@code fileName} to {@code writer}. */
    private static void copyRows(String fileName, CSVWriter writer, char columnSeparator, boolean skipHeader)
                    throws IOException {
        try (CSVReader reader = new CSVReader(new FileReader(fileName), columnSeparator)) {
            if (skipHeader) { // skip the header
                reader.readNext();
            }
            String[] nextLine;
            while ((nextLine = reader.readNext()) != null) {
                writer.writeNext(nextLine);
            }
        }
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy