All Downloads are FREE. Search and download functionalities are using the official Maven repository.

weka.attributeSelection.GreedyStepwise Maven / Gradle / Ivy

Go to download

The Waikato Environment for Knowledge Analysis (WEKA), a machine learning workbench. This version represents the developer version, the "bleeding edge" of development, you could say. New functionality gets added to this version.

There is a newer version: 3.9.6
Show newest version
/*
 *   This program is free software: you can redistribute it and/or modify
 *   it under the terms of the GNU General Public License as published by
 *   the Free Software Foundation, either version 3 of the License, or
 *   (at your option) any later version.
 *
 *   This program is distributed in the hope that it will be useful,
 *   but WITHOUT ANY WARRANTY; without even the implied warranty of
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *   GNU General Public License for more details.
 *
 *   You should have received a copy of the GNU General Public License
 *   along with this program.  If not, see .
 */

/*
 *    GreedyStepwise.java
 *    Copyright (C) 2004-2012 University of Waikato, Hamilton, New Zealand
 *
 */

package weka.attributeSelection;

import java.util.*;
import java.util.concurrent.Callable;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.Future;

import weka.core.Instances;
import weka.core.Option;
import weka.core.OptionHandler;
import weka.core.Range;
import weka.core.RevisionUtils;
import weka.core.Utils;

/**
 *  GreedyStepwise :
*
* Performs a greedy forward or backward search through the space of attribute * subsets. May start with no/all attributes or from an arbitrary point in the * space. Stops when the addition/deletion of any remaining attributes results * in a decrease in evaluation. Can also produce a ranked list of attributes by * traversing the space from one side to the other and recording the order that * attributes are selected.
*

* * * Valid options are: *

* *

 * -C
 *  Use conservative forward search
 * 
* *
 * -B
 *  Use a backward search instead of a
 *  forward one.
 * 
* *
 * -P <start set>
 *  Specify a starting set of attributes.
 *  Eg. 1,3,5-7.
 * 
* *
 * -R
 *  Produce a ranked list of attributes.
 * 
* *
 * -T <threshold>
 *  Specify a theshold by which attributes
 *  may be discarded from the ranking.
 *  Use in conjuction with -R
 * 
* *
 * -N <num to select>
 *  Specify number of attributes to select
 * 
* *
 * -num-slots <int>
 *  The number of execution slots, for example, the number of cores in the CPU. (default 1)
 * 
* *
 * -D
 *  Print debugging output
 * 
* * * * @author Mark Hall * @version $Revision: 15519 $ */ public class GreedyStepwise extends ASSearch implements RankedOutputSearch, StartSetHandler, OptionHandler { /** for serialization */ static final long serialVersionUID = -6312951970168325471L; /** does the data have a class */ protected boolean m_hasClass; /** holds the class index */ protected int m_classIndex; /** number of attributes in the data */ protected int m_numAttribs; /** true if the user has requested a ranked list of attributes */ protected boolean m_rankingRequested; /** * go from one side of the search space to the other in order to generate a * ranking */ protected boolean m_doRank; /** used to indicate whether or not ranking has been performed */ protected boolean m_doneRanking; /** * A threshold by which to discard attributes---used by the AttributeSelection * module */ protected double m_threshold; /** * The number of attributes to select. -1 indicates that all attributes are to * be retained. Has precedence over m_threshold */ protected int m_numToSelect = -1; protected int m_calculatedNumToSelect; /** the merit of the best subset found */ protected double m_bestMerit; /** a ranked list of attribute indexes */ protected double[][] m_rankedAtts; protected int m_rankedSoFar; /** the best subset found */ protected BitSet m_best_group; protected ASEvaluation m_ASEval; protected Instances m_Instances; /** holds the start set for the search as a Range */ protected Range m_startRange; /** holds an array of starting attributes */ protected int[] m_starting; /** Use a backwards search instead of a forwards one */ protected boolean m_backward = false; /** * If set then attributes will continue to be added during a forward search as * long as the merit does not degrade */ protected boolean m_conservativeSelection = false; /** Print debugging output */ protected boolean m_debug = false; protected int m_poolSize = 1; /** Thread pool */ protected transient ExecutorService m_pool = null; /** * Constructor */ public GreedyStepwise() { m_threshold = -Double.MAX_VALUE; m_doneRanking = false; m_startRange = new Range(); m_starting = null; resetOptions(); } /** * Returns a string describing this search method * * @return a description of the search suitable for displaying in the * explorer/experimenter gui */ public String globalInfo() { return "GreedyStepwise :\n\nPerforms a greedy forward or backward search " + "through " + "the space of attribute subsets. May start with no/all attributes or from " + "an arbitrary point in the space. Stops when the addition/deletion of any " + "remaining attributes results in a decrease in evaluation. " + "Can also produce a ranked list of " + "attributes by traversing the space from one side to the other and " + "recording the order that attributes are selected.\n"; } /** * Returns the tip text for this property * * @return tip text for this property suitable for displaying in the * explorer/experimenter gui */ public String searchBackwardsTipText() { return "Search backwards rather than forwards."; } /** * Set whether to search backwards instead of forwards * * @param back true to search backwards */ public void setSearchBackwards(boolean back) { m_backward = back; if (m_backward) { setGenerateRanking(false); } } /** * Get whether to search backwards * * @return true if the search will proceed backwards */ public boolean getSearchBackwards() { return m_backward; } /** * Returns the tip text for this property * * @return tip text for this property suitable for displaying in the * explorer/experimenter gui */ public String thresholdTipText() { return "Set threshold by which attributes can be discarded. Default value " + "results in no attributes being discarded. Use in conjunction with " + "generateRanking"; } /** * Set the threshold by which the AttributeSelection module can discard * attributes. * * @param threshold the threshold. */ @Override public void setThreshold(double threshold) { m_threshold = threshold; } /** * Returns the threshold so that the AttributeSelection module can discard * attributes from the ranking. */ @Override public double getThreshold() { return m_threshold; } /** * Returns the tip text for this property * * @return tip text for this property suitable for displaying in the * explorer/experimenter gui */ public String numToSelectTipText() { return "Specify the number of attributes to retain. The default value " + "(-1) indicates that all attributes are to be retained. Use either " + "this option or a threshold to reduce the attribute set."; } /** * Specify the number of attributes to select from the ranked list (if * generating a ranking). -1 indicates that all attributes are to be retained. * * @param n the number of attributes to retain */ @Override public void setNumToSelect(int n) { m_numToSelect = n; } /** * Gets the number of attributes to be retained. * * @return the number of attributes to retain */ @Override public int getNumToSelect() { return m_numToSelect; } /** * Gets the calculated number of attributes to retain. This is the actual * number of attributes to retain. This is the same as getNumToSelect if the * user specifies a number which is not less than zero. Otherwise it should be * the number of attributes in the (potentially transformed) data. */ @Override public int getCalculatedNumToSelect() { if (m_numToSelect >= 0) { m_calculatedNumToSelect = m_numToSelect; } return m_calculatedNumToSelect; } /** * Returns the tip text for this property * * @return tip text for this property suitable for displaying in the * explorer/experimenter gui */ public String generateRankingTipText() { return "Set to true if a ranked list is required."; } /** * Records whether the user has requested a ranked list of attributes. * * @param doRank true if ranking is requested */ @Override public void setGenerateRanking(boolean doRank) { m_rankingRequested = doRank; } /** * Gets whether ranking has been requested. This is used by the * AttributeSelection module to determine if rankedAttributes() should be * called. * * @return true if ranking has been requested. */ @Override public boolean getGenerateRanking() { return m_rankingRequested; } /** * Returns the tip text for this property * * @return tip text for this property suitable for displaying in the * explorer/experimenter gui */ public String startSetTipText() { return "Set the start point for the search. This is specified as a comma " + "separated list off attribute indexes starting at 1. It can include " + "ranges. Eg. 1,2,5-9,17."; } /** * Sets a starting set of attributes for the search. It is the search method's * responsibility to report this start set (if any) in its toString() method. * * @param startSet a string containing a list of attributes (and or ranges), * eg. 1,2,6,10-15. * @throws Exception if start set can't be set. */ @Override public void setStartSet(String startSet) throws Exception { m_startRange.setRanges(startSet); } /** * Returns a list of attributes (and or attribute ranges) as a String * * @return a list of attributes (and or attribute ranges) */ @Override public String getStartSet() { return m_startRange.getRanges(); } /** * Returns the tip text for this property * * @return tip text for this property suitable for displaying in the * explorer/experimenter gui */ public String conservativeForwardSelectionTipText() { return "If true (and forward search is selected) then attributes " + "will continue to be added to the best subset as long as merit does " + "not degrade."; } /** * Set whether attributes should continue to be added during a forward search * as long as merit does not decrease * * @param c true if atts should continue to be atted */ public void setConservativeForwardSelection(boolean c) { m_conservativeSelection = c; } /** * Gets whether conservative selection has been enabled * * @return true if conservative forward selection is enabled */ public boolean getConservativeForwardSelection() { return m_conservativeSelection; } /** * Returns the tip text for this property * * @return tip text for this property suitable for displaying in the * explorer/experimenter gui */ public String debuggingOutputTipText() { return "Output debugging information to the console"; } /** * Set whether to output debugging info to the console * * @param d true if dubugging info is to be output */ public void setDebuggingOutput(boolean d) { m_debug = d; } /** * Get whether to output debugging info to the console * * @return true if dubugging info is to be output */ public boolean getDebuggingOutput() { return m_debug; } /** * @return a string to describe the option */ public String numExecutionSlotsTipText() { return "The number of execution slots, for example, the number of cores in the CPU."; } /** * Gets the number of threads. */ public int getNumExecutionSlots() { return m_poolSize; } /** * Sets the number of threads */ public void setNumExecutionSlots(int nT) { m_poolSize = nT; } /** * Returns an enumeration describing the available options. * * @return an enumeration of all the available options. **/ @Override public Enumeration




© 2015 - 2024 Weber Informatics LLC | Privacy Policy