All Downloads are FREE. Search and download functionalities are using the official Maven repository.

weka.core.AttributeExpression Maven / Gradle / Ivy

/*
 *    This program is free software; you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation; either version 2 of the License, or
 *    (at your option) any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program; if not, write to the Free Software
 *    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

/*
 *    AttributeExpression.java
 *    Copyright (C) 2006 University of Waikato, Hamilton, New Zealand
 *
 */

package weka.core;

import java.io.Serializable;
import java.util.Stack;
import java.util.StringTokenizer;
import java.util.Vector;

/**
 * A general purpose class for parsing mathematical expressions
 * involving attribute values. Values can be provided in an array
 * or in an Instance. Values are accessed in the expression by
 * prefixing their index (starting at 1) with the character 'a'.
 *
 * 
 Example expression: a1^2*a5/log(a7*4.0) 
* * Supported opperators: +, -, *, /, ^, log, abs, cos, exp, sqrt, * floor, ceil, rint, tan, sin, (, ). * * @author Mark Hall * @version $Revision: 5989 $ */ public class AttributeExpression implements Serializable, RevisionHandler { /** for serialization */ static final long serialVersionUID = 402130123261736245L; /** * Inner class handling an attribute index as an operand */ private class AttributeOperand implements Serializable, RevisionHandler { /** for serialization */ static final long serialVersionUID = -7674280127286031105L; /** the index of the attribute */ protected int m_attributeIndex; /** true if the value of the attribute are to be multiplied by -1 */ protected boolean m_negative; /** * Constructor * * @param operand * @param sign * @throws Exception */ public AttributeOperand(String operand, boolean sign) throws Exception { // strip the leading 'a' and set the index m_attributeIndex = (Integer.parseInt(operand.substring(1)))-1; m_negative = sign; } /** * Return a string describing this object * @return a string descibing the attribute operand */ public String toString() { String result = ""; if (m_negative) { result += '-'; } return result+"a"+(m_attributeIndex+1); } /** * Returns the revision string. * * @return the revision */ public String getRevision() { return RevisionUtils.extract("$Revision: 5989 $"); } } /** * Inner class for storing numeric constant opperands */ private class NumericOperand implements Serializable, RevisionHandler { /** for serialization */ static final long serialVersionUID = 9037007836243662859L; /** numeric constant */ protected double m_numericConst; /** * Constructor * * @param operand * @param sign * @throws Exception */ public NumericOperand(String operand, boolean sign) throws Exception { m_numericConst = Double.valueOf(operand).doubleValue(); if (sign) { m_numericConst *= -1.0; } } /** * Return a string describing this object * @return a string descibing the numeric operand */ public String toString() { return ""+m_numericConst; } /** * Returns the revision string. * * @return the revision */ public String getRevision() { return RevisionUtils.extract("$Revision: 5989 $"); } } /** * Inner class for storing operators */ private class Operator implements Serializable, RevisionHandler { /** for serialization */ static final long serialVersionUID = -2760353522666004638L; /** the operator */ protected char m_operator; /** * Constructor * * @param opp the operator */ public Operator(char opp) { if (!isOperator(opp)) { throw new IllegalArgumentException("Unrecognized operator:" + opp); } m_operator = opp; } /** * Apply this operator to the supplied arguments * @param first the first argument * @param second the second argument * @return the result */ protected double applyOperator(double first, double second) { switch (m_operator) { case '+' : return (first+second); case '-' : return (first-second); case '*' : return (first*second); case '/' : return (first/second); case '^' : return Math.pow(first,second); } return Double.NaN; } /** * Apply this operator (function) to the supplied argument * @param value the argument * @return the result */ protected double applyFunction(double value) { switch (m_operator) { case 'l' : return Math.log(value); case 'b' : return Math.abs(value); case 'c' : return Math.cos(value); case 'e' : return Math.exp(value); case 's' : return Math.sqrt(value); case 'f' : return Math.floor(value); case 'h' : return Math.ceil(value); case 'r' : return Math.rint(value); case 't' : return Math.tan(value); case 'n' : return Math.sin(value); } return Double.NaN; } /** * Return a string describing this object * @return a string descibing the operator */ public String toString() { return ""+m_operator; } /** * Returns the revision string. * * @return the revision */ public String getRevision() { return RevisionUtils.extract("$Revision: 5989 $"); } } /** Operator stack */ private Stack m_operatorStack = new Stack(); /** Supported operators. l = log, b = abs, c = cos, e = exp, s = sqrt, f = floor, h = ceil, r = rint, t = tan, n = sin */ private static final String OPERATORS = "+-*/()^lbcesfhrtn"; /** Unary functions. l = log, b = abs, c = cos, e = exp, s = sqrt, f = floor, h = ceil, r = rint, t = tan, n = sin */ private static final String UNARY_FUNCTIONS = "lbcesfhrtn"; /** Holds the original infix expression */ private String m_originalInfix; /** Holds the expression in postfix form */ private Vector m_postFixExpVector; /** True if the next numeric constant or attribute index is negative */ private boolean m_signMod = false; /** Holds the previous token */ private String m_previousTok = ""; /** * Handles the processing of an infix operand to postfix * @param tok the infix operand * @throws Exception if there is difficulty parsing the operand */ private void handleOperand(String tok) throws Exception { // if it contains an 'a' then its an attribute index if (tok.indexOf('a') != -1) { m_postFixExpVector.addElement(new AttributeOperand(tok,m_signMod)); } else { try { // should be a numeric constant m_postFixExpVector.addElement(new NumericOperand(tok, m_signMod)); } catch (NumberFormatException ne) { throw new Exception("Trouble parsing numeric constant"); } } m_signMod = false; } /** * Handles the processing of an infix operator to postfix * @param tok the infix operator * @throws Exception if there is difficulty parsing the operator */ private void handleOperator(String tok) throws Exception { boolean push = true; char tokchar = tok.charAt(0); if (tokchar == ')') { String popop = " "; do { popop = (String)(m_operatorStack.pop()); if (popop.charAt(0) != '(') { m_postFixExpVector.addElement(new Operator(popop.charAt(0))); } } while (popop.charAt(0) != '('); } else { int infixToc = infixPriority(tok.charAt(0)); while (!m_operatorStack.empty() && stackPriority(((String)(m_operatorStack.peek())).charAt(0)) >= infixToc) { // try an catch double operators and see if the current one can // be interpreted as the sign of an upcoming number if (m_previousTok.length() == 1 && isOperator(m_previousTok.charAt(0)) && m_previousTok.charAt(0) != ')') { if (tok.charAt(0) == '-') { m_signMod = true; } else { m_signMod = false; } push = false; break; } else { String popop = (String)(m_operatorStack.pop()); m_postFixExpVector.addElement(new Operator(popop.charAt(0))); } } if (m_postFixExpVector.size() == 0) { if (tok.charAt(0) == '-') { m_signMod = true; push = false; } } if (push) { m_operatorStack.push(tok); } } } /** * Converts a string containing a mathematical expression in infix form * to postfix form. The result is stored in the vector m_postfixExpVector * * @param infixExp the infix expression to convert * @throws Exception if something goes wrong during the conversion */ public void convertInfixToPostfix(String infixExp) throws Exception { m_originalInfix = infixExp; infixExp = Utils.removeSubstring(infixExp, " "); infixExp = Utils.replaceSubstring(infixExp,"log","l"); infixExp = Utils.replaceSubstring(infixExp,"abs","b"); infixExp = Utils.replaceSubstring(infixExp,"cos","c"); infixExp = Utils.replaceSubstring(infixExp,"exp","e"); infixExp = Utils.replaceSubstring(infixExp,"sqrt","s"); infixExp = Utils.replaceSubstring(infixExp,"floor","f"); infixExp = Utils.replaceSubstring(infixExp,"ceil","h"); infixExp = Utils.replaceSubstring(infixExp,"rint","r"); infixExp = Utils.replaceSubstring(infixExp,"tan","t"); infixExp = Utils.replaceSubstring(infixExp,"sin","n"); StringTokenizer tokenizer = new StringTokenizer(infixExp, OPERATORS, true); m_postFixExpVector = new Vector(); while (tokenizer.hasMoreTokens()) { String tok = tokenizer.nextToken(); if (tok.length() > 1) { handleOperand(tok); } else { // probably an operator, but could be a single char operand if (isOperator(tok.charAt(0))) { handleOperator(tok); } else { // should be a numeric constant handleOperand(tok); } } m_previousTok = tok; } while (!m_operatorStack.empty()) { String popop = (String)(m_operatorStack.pop()); if (popop.charAt(0) == '(' || popop.charAt(0) == ')') { throw new Exception("Mis-matched parenthesis!"); } m_postFixExpVector.addElement(new Operator(popop.charAt(0))); } } /** * Evaluate the expression using the supplied Instance. * Assumes that the infix expression has been converted to * postfix and stored in m_postFixExpVector * * @param instance the Instance containing values to apply * the expression to * @throws Exception if something goes wrong */ public double evaluateExpression(Instance instance) throws Exception { double [] vals = new double [instance.numAttributes()+1]; for(int i = 0; i < instance.numAttributes(); i++) { if (instance.isMissing(i)) { vals[i] = Instance.missingValue(); } else { vals[i] = instance.value(i); } } evaluateExpression(vals); return vals[vals.length - 1]; } /** * Evaluate the expression using the supplied array of attribute values. * The result is stored in the last element of the array. Assumes that * the infix expression has been converted to postfix and stored in * m_postFixExpVector * @param vals the values to apply the expression to * @throws Exception if something goes wrong */ public void evaluateExpression(double [] vals) throws Exception { Stack operands = new Stack(); for (int i=0;i




© 2015 - 2025 Weber Informatics LLC | Privacy Policy