All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.expleague.ml.cli.modes.impl.SplitJsonPool Maven / Gradle / Ivy

There is a newer version: 1.4.9
Show newest version
package com.expleague.ml.cli.modes.impl;

import com.expleague.commons.text.StringUtils;
import com.expleague.commons.util.Pair;
import com.expleague.ml.cli.builders.data.impl.DataBuilderCrossValidation;
import com.expleague.ml.cli.modes.AbstractMode;
import com.expleague.ml.cli.modes.CliPoolReaderHelper;
import com.expleague.ml.data.tools.DataTools;
import com.expleague.ml.data.tools.Pool;
import org.apache.commons.cli.CommandLine;
import org.apache.commons.cli.MissingArgumentException;

import java.io.FileWriter;
import java.io.IOException;

import static com.expleague.ml.cli.JMLLCLI.*;

/**
 * User: qdeee
 * Date: 16.09.15
 */
public class SplitJsonPool extends AbstractMode {

  public void run(final CommandLine command) throws MissingArgumentException, IOException {
    if (!command.hasOption(LEARN_OPTION) && !command.hasOption(JSON_FORMAT) && !command.hasOption(CROSS_VALIDATION_OPTION)) {
      throw new MissingArgumentException("Please provide: learn_option, json_flag and cross_validation_option");
    }

    final DataBuilderCrossValidation builder = new DataBuilderCrossValidation();
    CliPoolReaderHelper.setPoolReader(command, builder);
    builder.setLearnPath(command.getOptionValue(LEARN_OPTION));
    final String[] cvOptions = StringUtils.split(command.getOptionValue(CROSS_VALIDATION_OPTION), "/", 2);
    builder.setRandomSeed(Integer.valueOf(cvOptions[0]));
    builder.setPartition(cvOptions[1]);

    final Pair pools = builder.create();

    final String outputName = getOutputName(command);
    DataTools.writePoolTo(pools.getFirst(), new FileWriter(outputName + ".learn"));
    DataTools.writePoolTo(pools.getSecond(), new FileWriter(outputName + ".test"));
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy