// weka.datagenerators.Test Maven / Gradle / Ivy

/*
 *   This program is free software: you can redistribute it and/or modify
 *   it under the terms of the GNU General Public License as published by
 *   the Free Software Foundation, either version 3 of the License, or
 *   (at your option) any later version.
 *
 *   This program is distributed in the hope that it will be useful,
 *   but WITHOUT ANY WARRANTY; without even the implied warranty of
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *   GNU General Public License for more details.
 *
 *   You should have received a copy of the GNU General Public License
 *   along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

/*
 * Test.java
 * Copyright (C) 2000-2012 University of Waikato, Hamilton, New Zealand
 *
 */

package weka.datagenerators;

import java.io.Serializable;

import weka.core.Attribute;
import weka.core.Instance;
import weka.core.Instances;
import weka.core.RevisionHandler;
import weka.core.RevisionUtils;
import weka.core.Utils;

/**
 * Class to represent a test.
 * <p>
 * The string representation of the test can be supplied in standard notation
 * or, for a subset of attribute types, in Prolog notation.
 * <p>
 * The following examples show all possible tests that can be represented by
 * this class, given in standard notation.
 * <p>
 * Examples of tests for numeric attributes:<br>
 * {@code B >= 2.333}<br>
 * {@code B < 4.56}
 * <p>
 * Examples of tests for nominal attributes with more than 2 values:<br>
 * {@code A = rain}<br>
 * {@code A != rain}
 * <p>
 * Examples of tests for nominal attributes with exactly 2 values:<br>
 * {@code A = false}<br>
 * {@code A = true}
 * <p>
 * The Prolog notation is only supplied for numeric attributes and for nominal
 * attributes that have the values "true" and "false".
 * <p>
 * The following examples show the Prolog notation.
 * <p>
 * Examples of tests for numeric attributes:<br>
 * The same as for standard notation above.
 * <p>
 * Examples of tests for nominal attributes with values "true" and "false":<br>
 * {@code A}<br>
 * {@code not(A)}
 * <p>
 * (Other nominal attributes are not supported by the Prolog notation.)
 * 
 * @author Gabi Schmidberger ([email protected])
 * @version $Revision: 10203 $
 **/

public class Test implements Serializable, RevisionHandler {

  /** for serialization */
  static final long serialVersionUID = -8890645875887157782L;

  /** the index of the attribute the test is applied to */
  int m_AttIndex;

  /**
   * the split: compared against directly for numeric attributes, truncated to
   * an int and used as a value index for nominal attributes
   */
  double m_Split;

  /** whether to negate the test */
  boolean m_Not;

  /** the dataset whose attribute definitions are used to render the test */
  Instances m_Dataset;

  /**
   * Creates a non-negated test.
   * 
   * @param i the attribute index
   * @param s the split
   * @param dataset the dataset
   */
  public Test(int i, double s, Instances dataset) {
    this(i, s, dataset, false);
  }

  /**
   * Creates a test that is optionally negated.
   * 
   * @param i the attribute index
   * @param s the split
   * @param dataset the dataset
   * @param n whether to negate the test
   */
  public Test(int i, double s, Instances dataset, boolean n) {
    m_AttIndex = i;
    m_Split = s;
    m_Dataset = dataset;
    m_Not = n;
  }

  /**
   * Negates the test. This object is left unchanged; a new test with the same
   * attribute index, split and dataset but the opposite negation flag is
   * returned.
   * 
   * @return a negated copy of this test
   */
  public Test getNot() {
    return new Test(m_AttIndex, m_Split, m_Dataset, !m_Not);
  }

  /**
   * Determines whether an instance passes the test.
   * <p>
   * For nominal attributes the instance value and the split are both truncated
   * to int and checked for equality (inequality if the test is negated). For
   * all other attributes the instance passes if its value is below the split
   * (at or above the split if the test is negated).
   * 
   * @param inst the instance
   * @return true if the instance satisfies the test, false otherwise; an
   *         instance whose value for the tested attribute is missing always
   *         fails
   * @throws Exception if something goes wrong
   */
  public boolean passesTest(Instance inst) throws Exception {
    if (inst.isMissing(m_AttIndex)) {
      return false; // missing values fail
    }

    double attribVal = inst.value(m_AttIndex);

    if (inst.attribute(m_AttIndex).isNominal()) {
      boolean sameValue = ((int) attribVal) == ((int) m_Split);
      // passes when "same value" and "negated" disagree
      return sameValue != m_Not;
    }

    // Deliberately phrased as negated comparisons: this keeps the outcome
    // identical to the historical implementation even if the split is NaN
    // (every comparison with NaN is false, so the test then passes).
    return m_Not ? !(attribVal < m_Split) : !(attribVal >= m_Split);
  }

  /**
   * Returns the test represented by a string in standard notation: the
   * attribute name, a blank, and the comparison.
   * 
   * @return a string representing the test
   */
  @Override
  public String toString() {
    return m_Dataset.attribute(m_AttIndex).name() + " " + testComparisonString();
  }

  /**
   * Returns the test represented by a string in Prolog notation.
   * <p>
   * Numeric attributes are rendered as in standard notation. For any other
   * attribute the value selected by the split is looked up; the value "false"
   * is rendered as <code>not(name)</code>, every other value as the bare
   * attribute name.
   * 
   * @return a string representing the test in Prolog notation
   */
  public String toPrologString() {
    Attribute att = m_Dataset.attribute(m_AttIndex);
    String attName = att.name();
    StringBuilder str = new StringBuilder();

    if (att.isNumeric()) {
      str.append(attName).append(' ');
      str.append(m_Not ? ">= " : "< ");
      str.append(Utils.doubleToString(m_Split, 3));
    } else {
      String value = att.value((int) m_Split);

      // Compare by content, not by reference: the value string is not
      // guaranteed to be the same object as the literal "false" (e.g. after
      // deserialization or when attribute values were read from a file).
      // NOTE(review): the negation flag is not consulted in this branch,
      // unlike in toString(); confirm whether that is intended.
      if ("false".equals(value)) {
        str.append("not(").append(attName).append(')');
      } else {
        str.append(attName);
      }
    }
    return str.toString();
  }

  /**
   * Gives a string representation of the test, starting from the comparison
   * symbol.
   * <p>
   * A negated test on a nominal attribute with exactly two values is written
   * as an equality with the other value instead of using "!=".
   * 
   * @return a string representing the test
   */
  private String testComparisonString() {
    Attribute att = m_Dataset.attribute(m_AttIndex);

    if (att.isNumeric()) {
      return (m_Not ? ">= " : "< ") + Utils.doubleToString(m_Split, 3);
    }

    int valueIndex = (int) m_Split;
    if (att.numValues() != 2) {
      return (m_Not ? "!= " : "= ") + att.value(valueIndex);
    }

    // two-valued attribute: negation selects the complementary value
    int shownIndex = m_Not ? (valueIndex == 0 ? 1 : 0) : valueIndex;
    return "= " + att.value(shownIndex);
  }

  /**
   * Compares the test with the test that is given as parameter. Two tests are
   * considered equal if attribute index, split and negation flag agree; the
   * dataset is not compared.
   * 
   * @param t the test the object is compared to, may be null
   * @return true if the two Tests are equal, false otherwise (including when
   *         <code>t</code> is null)
   */
  public boolean equalTo(Test t) {
    return t != null && m_AttIndex == t.m_AttIndex && m_Split == t.m_Split
      && m_Not == t.m_Not;
  }

  /**
   * Returns the revision string.
   * 
   * @return the revision
   */
  @Override
  public String getRevision() {
    return RevisionUtils.extract("$Revision: 10203 $");
  }
}