All Downloads are FREE. Search and download functionalities are using the official Maven repository.

edu.emory.mathcs.nlp.common.util.CharTokenizer Maven / Gradle / Ivy

The newest version!
/**
 * Copyright 2015, Emory University
 * 
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 * 
 *     http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package edu.emory.mathcs.nlp.common.util;

import java.util.ArrayList;
import java.util.List;

import edu.emory.mathcs.nlp.common.constant.StringConst;

/**
 * @author Jinho D. Choi ({@code [email protected]})
 */
public class CharTokenizer
{
	private char c_delim;
	
	/**
	 * Creates a tokenizer configured with the given delimiter character.
	 * The delimiter is installed through {@link #initDelimiter(char)}.
	 *
	 * @param delim the delimiter character to store.
	 */
	public CharTokenizer(char delim)
	{
		this.initDelimiter(delim);
	}
	
	/**
	 * Replaces the delimiter character held by this tokenizer.
	 *
	 * @param delim the new delimiter character.
	 */
	public void initDelimiter(char delim)
	{
		this.c_delim = delim;
	}
	
	/**
	 * Tokenizes {@code s} with {@code includeEmpty} set to {@code false};
	 * shorthand for {@code tokenizeToList(s, false)}.
	 *
	 * @param s the string to tokenize.
	 * @return the list produced by the two-argument overload.
	 */
	public List<String> tokenizeToList(String s)
	{
		// Parameterized return type instead of the raw List: the elements are
		// strings (the array-returning variant copies them into a String[]).
		return tokenizeToList(s, false);
	}
	
	public List tokenizeToList(String s, boolean includeEmpty)
	{
		List list = new ArrayList<>();
		int i, bIndex = 0, len = s.length();
		char[] cs = s.toCharArray();
		
		for (i=0; i list = tokenizeToList(s, includeEmpty);
		return list.toArray(new String[list.size()]);
	}
	
	/**
	 * Tokenizes {@code s} without including empty strings; shorthand for
	 * {@code tokenize(s, false)}.
	 *
	 * @param s the string to tokenize.
	 * @return the tokens as an array.
	 */
	public String[] tokenize(String s)
	{
		final boolean includeEmpty = false;
		return tokenize(s, includeEmpty);
	}

//	public String[] tokenize(String s, boolean includeDelim)
//	{
//		IntArrayList list = new IntArrayList();
//		char[] cs = s.toCharArray();
//		int i, len = s.length();
//		
//		for (i=0; i




© 2015 - 2024 Weber Informatics LLC | Privacy Policy