edu.emory.mathcs.nlp.common.util.CharTokenizer Maven / Gradle / Ivy
The newest version!
/**
* Copyright 2015, Emory University
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package edu.emory.mathcs.nlp.common.util;
import java.util.ArrayList;
import java.util.List;
import edu.emory.mathcs.nlp.common.constant.StringConst;
/**
* @author Jinho D. Choi ({@code [email protected]})
*/
public class CharTokenizer
{
private char c_delim;
/**
 * Creates a tokenizer configured with the given delimiter character.
 * The delimiter is stored by delegating to {@link #initDelimiter(char)}.
 *
 * @param delim the delimiter character.
 */
public CharTokenizer(char delim)
{
    this.initDelimiter(delim);
}
/**
 * Stores the given character in this tokenizer's delimiter field,
 * replacing whatever value was held before.
 *
 * @param delim the new delimiter character.
 */
public void initDelimiter(char delim)
{
    this.c_delim = delim;
}
/**
 * Tokenizes the given string into a list.
 * Delegates to {@code tokenizeToList(s, false)}, i.e. with the
 * {@code includeEmpty} flag turned off.
 *
 * @param s the string to tokenize.
 * @return the list produced by {@code tokenizeToList(s, false)}.
 */
public List<String> tokenizeToList(String s)
{
    // The element type is String: the array-returning variant copies this
    // list into a String[]; a raw List here would force unchecked casts on callers.
    return tokenizeToList(s, false);
}
// NOTE(review): this span appears to be corrupted. The for-statement below has
// no loop condition or body, and the same line continues with
// "list = tokenizeToList(s, includeEmpty);", followed by a String[] conversion,
// although the method header here declares a List return type. It looks like
// text between a '<' and a later '>' was dropped, fusing this method with the
// following array-returning one, and the generic type arguments on List were
// lost the same way. Restore from the upstream source before compiling -- TODO confirm.
public List tokenizeToList(String s, boolean includeEmpty)
{
List list = new ArrayList<>();
// bIndex starts at 0 and len caches the input length; how they are used is
// not visible because the loop body is missing.
int i, bIndex = 0, len = s.length();
char[] cs = s.toCharArray();
for (i=0; i list = tokenizeToList(s, includeEmpty);
// Copies the list into a String array sized to the list.
return list.toArray(new String[list.size()]);
}
/**
 * Tokenizes the given string into an array, not including empty strings.
 * Equivalent to calling {@code tokenize(s, false)}.
 *
 * @param s the string to tokenize.
 * @return the array produced by {@code tokenize(s, false)}.
 */
public String[] tokenize(String s)
{
    final boolean includeEmpty = false;
    return tokenize(s, includeEmpty);
}
// public String[] tokenize(String s, boolean includeDelim)
// {
// IntArrayList list = new IntArrayList();
// char[] cs = s.toCharArray();
// int i, len = s.length();
//
// for (i=0; i
© 2015 - 2024 Weber Informatics LLC | Privacy Policy