simplegrammar.SimpleTokenizer Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of simple-grammar Show documentation
Show all versions of simple-grammar Show documentation
Library is used to define LL* grammars and use them to parse text data, e. g. programming
languages or data in different formats like JSON or XML
The newest version!
/*
Copyright 2019 Sergejs Vinniks
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package simplegrammar;
import java.util.ArrayList;
import java.util.HashSet;
import java.util.List;
import java.util.Set;
public class SimpleTokenizer extends Tokenizer {
private final Set ignoredTokens;
private final List tokens;
private int position;
public SimpleTokenizer() {
ignoredTokens = new HashSet<>();
tokens = new ArrayList<>();
position = -1;
}
public void ignoreTokens(String... tokens) {
for (String token : tokens)
ignoredTokens.add(token);
}
public void addToken(Token token) {
if (!ignoredTokens.contains(token.getName()))
tokens.add(token);
}
public void addAll(Tokenizer tokenizer) {
while (tokenizer.hasNext())
addToken(tokenizer.get());
}
@Override
public boolean hasNext(int depth) {
return tokens.size() > position + depth;
}
@Override
protected Token doPeek(int depth) {
return tokens.get(position + depth);
}
@Override
protected Token doGet() {
position++;
return doPeek(0);
}
public void reset() {
position = -1;
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy