All Downloads are FREE. Search and download functionalities are using the official Maven repository.

weka.core.converters.CSVSaver Maven / Gradle / Ivy

/*
 *    This program is free software; you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation; either version 2 of the License, or
 *    (at your option) any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program; if not, write to the Free Software
 *    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

/*
 *    CSVSaver.java
 *    Copyright (C) 2004 University of Waikato, Hamilton, New Zealand
 *
 */

package weka.core.converters;

import weka.core.Capabilities;
import weka.core.Instance;
import weka.core.Instances;
import weka.core.RevisionUtils;
import weka.core.SparseInstance;
import weka.core.Capabilities.Capability;
import weka.core.Utils;

import java.io.IOException;
import java.io.PrintWriter;

/**
 
 * Writes to a destination that is in csv format
 * 

* * Valid options are:

* *

 -i <the input file>
 * The input file
* *
 -o <the output file>
 * The output file
* * * @author Stefan Mutter ([email protected]) * @version $Revision: 7950 $ * @see Saver */ public class CSVSaver extends AbstractFileSaver implements BatchConverter, IncrementalConverter, FileSourcedConverter { /** for serialization */ static final long serialVersionUID = 476636654410701807L; /** Constructor */ public CSVSaver(){ resetOptions(); } /** * Returns a string describing this Saver * @return a description of the Saver suitable for * displaying in the explorer/experimenter gui */ public String globalInfo() { return "Writes to a destination that is in csv format"; } /** * Returns a description of the file type. * * @return a short file description */ public String getFileDescription() { return "CSV file: comma separated files"; } /** * Resets the Saver */ public void resetOptions() { super.resetOptions(); setFileExtension(".csv"); } /** * Returns the Capabilities of this saver. * * @return the capabilities of this object * @see Capabilities */ public Capabilities getCapabilities() { Capabilities result = super.getCapabilities(); // attributes result.enable(Capability.NOMINAL_ATTRIBUTES); result.enable(Capability.NUMERIC_ATTRIBUTES); result.enable(Capability.DATE_ATTRIBUTES); result.enable(Capability.STRING_ATTRIBUTES); result.enable(Capability.MISSING_VALUES); // class result.enable(Capability.NOMINAL_CLASS); result.enable(Capability.NUMERIC_CLASS); result.enable(Capability.DATE_CLASS); result.enable(Capability.STRING_CLASS); result.enable(Capability.MISSING_CLASS_VALUES); result.enable(Capability.NO_CLASS); return result; } /** Saves an instances incrementally. Structure has to be set by using the * setStructure() method or setInstances() method. * @param inst the instance to save * @throws IOException throws IOEXception if an instance cannot be saved incrementally. */ public void writeIncremental(Instance inst) throws IOException{ int writeMode = getWriteMode(); Instances structure = getInstances(); PrintWriter outW = null; if(getRetrieval() == BATCH || getRetrieval() == NONE) throw new IOException("Batch and incremental saving cannot be mixed."); if(getWriter() != null) outW = new PrintWriter(getWriter()); if(writeMode == WAIT){ if(structure == null){ setWriteMode(CANCEL); if(inst != null) System.err.println("Structure(Header Information) has to be set in advance"); } else setWriteMode(STRUCTURE_READY); writeMode = getWriteMode(); } if(writeMode == CANCEL){ if(outW != null) outW.close(); cancel(); } if(writeMode == STRUCTURE_READY){ setWriteMode(WRITE); //write header if(retrieveFile() == null && outW == null){ // print out attribute names as first row for (int i = 0; i < structure.numAttributes(); i++) { System.out.print(structure.attribute(i).name()); if (i < structure.numAttributes()-1) { System.out.print(","); } else { System.out.println(); } } } else{ for (int i = 0; i < structure.numAttributes(); i++) { outW.print(structure.attribute(i).name()); if (i < structure.numAttributes()-1) { outW.print(","); } else { outW.println(); } } outW.flush(); } writeMode = getWriteMode(); } if(writeMode == WRITE){ if(structure == null) throw new IOException("No instances information available."); if(inst != null){ //write instance if(retrieveFile() == null && outW == null) System.out.println(inst); else{ outW.println(instanceToString(inst)); //flushes every 100 instances m_incrementalCounter++; if(m_incrementalCounter > 100){ m_incrementalCounter = 0; outW.flush(); } } } else{ //close if(outW != null){ outW.flush(); outW.close(); } m_incrementalCounter = 0; resetStructure(); outW = null; resetWriter(); } } } /** Writes a Batch of instances * @throws IOException throws IOException if saving in batch mode is not possible */ public void writeBatch() throws IOException { if(getInstances() == null) throw new IOException("No instances to save"); if(getRetrieval() == INCREMENTAL) throw new IOException("Batch and incremental saving cannot be mixed."); setRetrieval(BATCH); setWriteMode(WRITE); if(retrieveFile() == null && getWriter() == null){ // print out attribute names as first row for (int i = 0; i < getInstances().numAttributes(); i++) { System.out.print(getInstances().attribute(i).name()); if (i < getInstances().numAttributes()-1) { System.out.print(","); } else { System.out.println(); } } for (int i = 0; i < getInstances().numInstances(); i++) { System.out.println(getInstances().instance(i)); } setWriteMode(WAIT); return; } PrintWriter outW = new PrintWriter(getWriter()); // print out attribute names as first row for (int i = 0; i < getInstances().numAttributes(); i++) { outW.print(Utils.quote(getInstances().attribute(i).name())); if (i < getInstances().numAttributes()-1) { outW.print(","); } else { outW.println(); } } for (int i = 0; i < getInstances().numInstances(); i++) { outW.println(instanceToString((getInstances().instance(i)))); } outW.flush(); outW.close(); setWriteMode(WAIT); outW = null; resetWriter(); setWriteMode(CANCEL); } /** * turns an instance into a string. takes care of sparse instances as well. * * @param inst the instance to turn into a string */ protected String instanceToString(Instance inst) { StringBuffer result; Instance outInst; int i; result = new StringBuffer(); if (inst instanceof SparseInstance) { outInst = new Instance(inst.weight(), inst.toDoubleArray()); outInst.setDataset(inst.dataset()); } else { outInst = inst; } for (i = 0; i < outInst.numAttributes(); i++) { if (i > 0) result.append(","); if (outInst.isMissing(i)) result.append("?"); else result.append(outInst.toString(i)); } return result.toString(); } /** * Returns the revision string. * * @return the revision */ public String getRevision() { return RevisionUtils.extract("$Revision: 7950 $"); } /** * Main method. * * @param args should contain the options of a Saver. */ public static void main(String[] args) { runFileSaver(new CSVSaver(), args); } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy