All downloads are free. Search and download functionality uses the official Maven repository.

weka.core.converters.XRFFSaver Maven / Gradle / Ivy

/*
 *    This program is free software; you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation; either version 2 of the License, or
 *    (at your option) any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program; if not, write to the Free Software
 *    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

/*
 * XRFFSaver.java
 * Copyright (C) 2006 University of Waikato, Hamilton, New Zealand
 *
 */

package weka.core.converters;

import weka.core.Capabilities;
import weka.core.Instances;
import weka.core.Option;
import weka.core.RevisionUtils;
import weka.core.SingleIndex;
import weka.core.Utils;
import weka.core.Capabilities.Capability;
import weka.core.xml.XMLInstances;

import java.io.File;
import java.io.IOException;
import java.io.OutputStream;
import java.io.PrintWriter;
import java.util.Enumeration;
import java.util.Vector;
import java.util.zip.GZIPOutputStream;

/**
 
 * Writes to a destination that is in the XML version of the ARFF format. The data can be compressed with gzip, in order to save space.
 * 

* * Valid options are:

* *

 -i <the input file>
 *  The input file
* *
 -o <the output file>
 *  The output file
* *
 -C <class index>
 *  The class index (first and last are valid as well).
 *  (default: last)
* *
 -compress
 *  Compresses the data (uses '.xrff.gz' as extension instead of '.xrff')
 *  (default: off)
* * * @author FracPete (fracpete at waikato dot ac dot nz) * @version $Revision: 1.5 $ * @see Saver */ public class XRFFSaver extends AbstractFileSaver implements BatchConverter { /** for serialization */ private static final long serialVersionUID = -7226404765213522043L; /** the class index */ protected SingleIndex m_ClassIndex = new SingleIndex(); /** the generated XML document */ protected XMLInstances m_XMLInstances; /** whether to compress the output */ protected boolean m_CompressOutput = false; /** * Constructor */ public XRFFSaver(){ resetOptions(); } /** * Returns a string describing this Saver * * @return a description of the Saver suitable for * displaying in the explorer/experimenter gui */ public String globalInfo() { return "Writes to a destination that is in the XML version of the ARFF format. " + "The data can be compressed with gzip, in order to save space."; } /** * Returns an enumeration describing the available options. * * @return an enumeration of all the available options. 
*/ public Enumeration listOptions() { Vector result; result = new Vector(); Enumeration en = super.listOptions(); while (en.hasMoreElements()) result.addElement(en.nextElement()); result.addElement( new Option( "\tThe class index (first and last are valid as well).\n" + "\t(default: last)", "C", 1, "-C ")); result.addElement( new Option( "\tCompresses the data (uses '" + XRFFLoader.FILE_EXTENSION_COMPRESSED + "' as extension instead of '" + XRFFLoader.FILE_EXTENSION + "')\n" + "\t(default: off)", "compress", 0, "-compress")); return result.elements(); } /** * returns the options of the current setup * * @return the current options */ public String[] getOptions(){ int i; Vector result; String[] options; result = new Vector(); if (getClassIndex().length() != 0) { result.add("-C"); result.add(getClassIndex()); } if (getCompressOutput()) result.add("-compress"); options = super.getOptions(); for (i = 0; i < options.length; i++) result.add(options[i]); return (String[]) result.toArray(new String[result.size()]); } /** * Parses the options for this object.

* * Valid options are:

* *

 -i <the input file>
   *  The input file
* *
 -o <the output file>
   *  The output file
* *
 -C <class index>
   *  The class index (first and last are valid as well).
   *  (default: last)
* *
 -compress
   *  Compresses the data (uses '.xrff.gz' as extension instead of '.xrff')
   *  (default: off)
* * * @param options the options to use * @throws Exception if setting of options fails */ public void setOptions(String[] options) throws Exception { String tmpStr; tmpStr = Utils.getOption('C', options); if (tmpStr.length() != 0) setClassIndex(tmpStr); else setClassIndex("last"); setCompressOutput(Utils.getFlag("compress", options)); super.setOptions(options); } /** * Returns a description of the file type. * * @return a short file description */ public String getFileDescription() { return "XRFF data files"; } /** * Gets all the file extensions used for this type of file * * @return the file extensions */ public String[] getFileExtensions() { return new String[]{XRFFLoader.FILE_EXTENSION, XRFFLoader.FILE_EXTENSION_COMPRESSED}; } /** * Sets the destination file. * * @param outputFile the destination file. * @throws IOException throws an IOException if file cannot be set */ public void setFile(File outputFile) throws IOException { if (outputFile.getAbsolutePath().endsWith(XRFFLoader.FILE_EXTENSION_COMPRESSED)) setCompressOutput(true); super.setFile(outputFile); } /** * Resets the Saver */ public void resetOptions() { super.resetOptions(); if (getCompressOutput()) setFileExtension(XRFFLoader.FILE_EXTENSION_COMPRESSED); else setFileExtension(XRFFLoader.FILE_EXTENSION); try { m_XMLInstances = new XMLInstances(); } catch (Exception e) { m_XMLInstances = null; } } /** * Returns the tip text for this property * * @return tip text for this property suitable for * displaying in the explorer/experimenter gui */ public String classIndexTipText() { return "Sets the class index (\"first\" and \"last\" are valid values)"; } /** * Get the index of the class attribute. * * @return the index of the class attribute */ public String getClassIndex() { return m_ClassIndex.getSingleIndex(); } /** * Sets index of the class attribute. 
* * @param value the index of the class attribute */ public void setClassIndex(String value) { m_ClassIndex.setSingleIndex(value); } /** * Returns the tip text for this property * * @return tip text for this property suitable for * displaying in the explorer/experimenter gui */ public String compressOutputTipText() { return "Optional compression of the output data"; } /** * Gets whether the output data is compressed. * * @return true if the output data is compressed */ public boolean getCompressOutput() { return m_CompressOutput; } /** * Sets whether to compress the output. * * @param value if truee the output will be compressed */ public void setCompressOutput(boolean value) { m_CompressOutput = value; } /** * Returns the Capabilities of this saver. * * @return the capabilities of this object * @see Capabilities */ public Capabilities getCapabilities() { Capabilities result = super.getCapabilities(); // attributes result.enableAllAttributes(); result.enable(Capability.MISSING_VALUES); // class result.enableAllClasses(); result.enable(Capability.MISSING_CLASS_VALUES); result.enable(Capability.NO_CLASS); return result; } /** * Sets instances that should be stored. * * @param instances the instances */ public void setInstances(Instances instances) { if (m_ClassIndex.getSingleIndex().length() != 0) { m_ClassIndex.setUpper(instances.numAttributes() - 1); instances.setClassIndex(m_ClassIndex.getIndex()); } super.setInstances(instances); } /** * Sets the destination output stream. * * @param output the output stream. 
* @throws IOException throws an IOException if destination cannot be set */ public void setDestination(OutputStream output) throws IOException { if (getCompressOutput()) super.setDestination(new GZIPOutputStream(output)); else super.setDestination(output); } /** * Writes a Batch of instances * * @throws IOException throws IOException if saving in batch mode * is not possible */ public void writeBatch() throws IOException { if (getInstances() == null) throw new IOException("No instances to save"); if (getRetrieval() == INCREMENTAL) throw new IOException("Batch and incremental saving cannot be mixed."); setRetrieval(BATCH); setWriteMode(WRITE); // generate XML m_XMLInstances.setInstances(getInstances()); if ((retrieveFile() == null) && (getWriter() == null)) { System.out.println(m_XMLInstances.toString()); setWriteMode(WAIT); } else { PrintWriter outW = new PrintWriter(getWriter()); outW.println(m_XMLInstances.toString()); outW.flush(); outW.close(); setWriteMode(WAIT); outW = null; resetWriter(); setWriteMode(CANCEL); } } /** * Returns the revision string. * * @return the revision */ public String getRevision() { return RevisionUtils.extract("$Revision: 1.5 $"); } /** * Main method. * * @param args should contain the options of a Saver. */ public static void main(String[] args) { runFileSaver(new XRFFSaver(), args); } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy