org.navimatrix.jaxen.function.StringLengthFunction Maven / Gradle / Ivy
/*
* $Header: /cvs/jaxen/jaxen/src/java/main/org/jaxen/function/StringLengthFunction.java,v 1.12 2006/02/05 21:47:41 elharo Exp $
* $Revision: 1.12 $
* $Date: 2006/02/05 21:47:41 $
*
* ====================================================================
*
* Copyright 2000-2002 bob mcwhirter & James Strachan.
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are
* met:
*
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* * Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* * Neither the name of the Jaxen Project nor the names of its
* contributors may be used to endorse or promote products derived
* from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
* IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
* PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
* OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
* ====================================================================
* This software consists of voluntary contributions made by many
* individuals on behalf of the Jaxen Project and was originally
* created by bob mcwhirter <bob@werken.com> and
* James Strachan <jstrachan@apache.org>. For more information on the
* Jaxen Project, please see <http://www.jaxen.org/>.
*
* $Id: StringLengthFunction.java,v 1.12 2006/02/05 21:47:41 elharo Exp $
*/
package org.navimatrix.jaxen.function;
import java.util.List;
import org.navimatrix.jaxen.Context;
import org.navimatrix.jaxen.Function;
import org.navimatrix.jaxen.FunctionCallException;
import org.navimatrix.jaxen.Navigator;
/**
* 4.2 number string-length(string)
*
*
* The <b>string-length</b> function returns the number of <strong>Unicode characters</strong>
* in its argument. This is not necessarily
* the same as the number of <strong>Java <code>char</code>s</strong>
* in the corresponding Java string. In particular, if the Java <code>String</code>
* contains surrogate pairs, each such pair will be counted as only one character
* by this function. If the argument is omitted,
* it returns the length of the string-value of the context node.
*
*
* @author bob mcwhirter (bob @ werken.com)
* @see <a href="https://www.w3.org/TR/xpath#function-string-length" target="_top">Section
* 4.2 of the XPath Specification</a>
*/
public class StringLengthFunction implements Function
{

    /**
     * Create a new <code>StringLengthFunction</code> object.
     */
    public StringLengthFunction() {}

    /**
     * <p>
     * Returns the number of Unicode characters in the string-value of the argument.
     * </p>
     *
     * @param context the context at the point in the
     *         expression when the function is called
     * @param args a list containing the item whose string-value is to be counted.
     *         If empty, the length of the context node's string-value is returned.
     *
     * @return a <code>Double</code> giving the number of Unicode characters
     *
     * @throws FunctionCallException if <code>args</code> has more than one item,
     *         or if the string-value contains mismatched surrogates
     */
    public Object call(Context context,
                       List args) throws FunctionCallException
    {
        if (args.size() == 0)
        {
            // No argument: measure the string-value of the context node-set.
            return evaluate( context.getNodeSet(),
                             context.getNavigator() );
        }
        else if (args.size() == 1)
        {
            return evaluate( args.get(0),
                             context.getNavigator() );
        }

        throw new FunctionCallException( "string-length() requires one argument." );
    }

    /**
     * <p>
     * Returns the number of Unicode characters in the string-value of
     * an object. A well-formed surrogate pair (a high surrogate in
     * U+D800..U+DBFF immediately followed by a low surrogate in
     * U+DC00..U+DFFF) counts as a single character; every other
     * <code>char</code>, including those in U+E000..U+FFFF, counts as one
     * character on its own.
     * </p>
     *
     * @param obj the object whose string-value is counted
     * @param nav used to calculate the string-value of <code>obj</code>
     *
     * @return a <code>Double</code> giving the number of Unicode characters
     *
     * @throws FunctionCallException if the string contains mismatched surrogates,
     *         that is, a high surrogate not followed by a low surrogate or a
     *         low surrogate not preceded by a high surrogate
     */
    public static Double evaluate(Object obj, Navigator nav) throws FunctionCallException
    {
        String str = StringFunction.evaluate( obj, nav );

        // String.length() counts UTF-16 code units, not Unicode characters,
        // so surrogate pairs have to be collapsed by hand.
        final int units = str.length();
        int length = 0;
        for (int i = 0; i < units; i++) {
            char c = str.charAt(i);
            length++;

            if (c >= 0xD800 && c <= 0xDBFF) {
                // High surrogate: the next code unit must exist and must be
                // a low surrogate, otherwise the string is malformed.
                if (i + 1 >= units) {
                    throw new FunctionCallException("Bad surrogate pair in string " + str);
                }
                char low = str.charAt(i + 1);
                if (low < 0xDC00 || low > 0xDFFF) {
                    throw new FunctionCallException("Bad surrogate pair in string " + str);
                }
                i++; // increment past low surrogate
            }
            else if (c >= 0xDC00 && c <= 0xDFFF) {
                // Low surrogate that was not consumed as the second half of
                // a pair: it has no preceding high surrogate.
                throw new FunctionCallException("Bad surrogate pair in string " + str);
            }
            // Anything else (including U+E000..U+FFFF) is an ordinary
            // single-unit character and needs no further handling.
        }

        // new Double(...) rather than Double.valueOf(...) keeps the class
        // compilable at the pre-Java-5 source level the rest of the file uses.
        return new Double(length);
    }

}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy