All Downloads are FREE. Search and download functionalities are using the official Maven repository.

edu.emory.mathcs.nlp.common.util.StringUtils Maven / Gradle / Ivy

The newest version!
/**
 * Copyright 2015, Emory University
 * 
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 * 
 *     http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package edu.emory.mathcs.nlp.common.util;

import java.util.ArrayList;
import java.util.List;

import edu.emory.mathcs.nlp.common.constant.CharConst;
import edu.emory.mathcs.nlp.common.constant.MetaConst;
import edu.emory.mathcs.nlp.common.constant.StringConst;

/**
 * @author Jinho D. Choi ({@code [email protected]})
 */
public class StringUtils
{
	/** Private so that this class, which exposes only static helpers here, cannot be instantiated from outside. */
	private StringUtils() {}
	
	/**
	 * Computes the length of the longest common subsequence of two token sequences.
	 * Elements are compared with {@link String#equals(Object)}; the matched elements
	 * must appear in the same relative order in both arrays but need not be contiguous.
	 * @param x the first sequence.
	 * @param y the second sequence.
	 * @return the number of elements in the longest common subsequence of {@code x} and {@code y}.
	 */
	static public int getLCSLength(String[] x, String[] y)
	{
		final int rows = x.length;
		final int cols = y.length;
		
		// table[r][c] holds the LCS length of the first r elements of x and the first c elements of y;
		// row 0 and column 0 stay at zero (empty prefix).
		final int[][] table = new int[rows+1][cols+1];
		
		for (int r=1; r<=rows; r++)
		{
			final String left = x[r-1];
			
			for (int c=1; c<=cols; c++)
			{
				if (left.equals(y[c-1]))
				{
					// Matching elements extend the best result of both shorter prefixes.
					table[r][c] = table[r-1][c-1] + 1;
				}
				else
				{
					// Otherwise carry over the better result from dropping one element on either side.
					table[r][c] = Math.max(table[r][c-1], table[r-1][c]);
				}
			}
		}
		
		return table[rows][cols];
	}
	
	static public String removeAll(String original, char remove)
	{
		char[] cs = original.toCharArray();
		char[] ns = new char[cs.length];
		int i, j;
		
		for (i=0,j=0; i 1 && CharUtils.isPunctuation(cs[i]) && cs[i] == cs[i-1] && cs[i] == cs[i-2])
				continue;
			
			build.append(cs[i]);
		}
		
		return (build.length() < size) ? build.toString() : s;
	}
	
	/**
	 * Copies into a new list every token that {@code containsPunctuationOnly} does not accept.
	 * The input list is only read, never modified, and the relative order of the kept tokens is preserved.
	 * @param tokens the tokens to filter.
	 * @return a new list of the tokens for which {@code containsPunctuationOnly} returns {@code false}.
	 */
	static public List<String> stripPunctuation(List<String> tokens)
	{
		// Element types are declared explicitly: iterating a raw List as String does not compile.
		List<String> list = new ArrayList<>();
		
		for (String token : tokens)
		{
			if (!containsPunctuationOnly(token))
				list.add(token);
		}
		
		return list;
	}
	
	/**
	 * Copies into a new list every token that {@code containsPunctuationOnly} does not accept.
	 * The input array is only read, never modified, and the relative order of the kept tokens is preserved.
	 * @param tokens the tokens to filter.
	 * @return a new list of the tokens for which {@code containsPunctuationOnly} returns {@code false}.
	 */
	static public List<String> stripPunctuation(String[] tokens)
	{
		// A parameterized list avoids unchecked add() calls and spares callers a cast on every element.
		List<String> list = new ArrayList<>();
		
		for (String token : tokens)
		{
			if (!containsPunctuationOnly(token))
				list.add(token);
		}
		
		return list;
	}
	
//	====================================== Boolean ======================================
	
	/**
	 * @return {@code true} if the specified string includes only upper-case characters.
	 * @see CharUtils#isUpperCase(char)
	 */
	static public boolean containsUpperCaseOnly(String s)
	{
		char[] cs= s.toCharArray();
		int i, size = cs.length;
		
		for (i=0; i




© 2015 - 2024 Weber Informatics LLC | Privacy Policy