All Downloads are FREE. Search and download functionalities are using the official Maven repository.

ai.preferred.regression.pe.Partition Maven / Gradle / Ivy

The newest version!
/*
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */

package ai.preferred.regression.pe;

import ai.preferred.regression.io.CSVInputData;
import org.apache.commons.csv.CSVPrinter;
import org.kohsuke.args4j.Option;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.io.IOException;
import java.util.ArrayList;

public class Partition extends ProcessingElement {

  private static final Logger LOGGER = LoggerFactory.getLogger(Partition.class);

  @Option(name = "-p", aliases = {"--proportion"}, usage = "the proportion of data to be selected or excluded (ranges from 0.0 to 1.0)")
  private double percent = 0.8;

  @Option(name = "-e", aliases = {"--exclude"}, usage = "takes the other half of the selection if specified")
  private boolean exclude = false;

  @Override
  protected void process(CSVInputData reader, CSVPrinter printer) throws IOException {
    if (reader.hasHeader()) {
      printer.printRecord(reader.getHeader());
    }

    final ArrayList> data = reader.getRecords();
    final int n = (int) Math.round(percent * data.size());

    if (exclude) {
      printer.printRecords(data.subList(n, data.size()));
    } else {
      printer.printRecords(data.subList(0, n));
    }
  }

  public static void main(String[] args) {
    parseArgsAndRun(Partition.class, args);
  }

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy