ai.vespa.schemals.schemadocument.SchemaDocumentLexer Maven / Gradle / Ivy
package ai.vespa.schemals.schemadocument;
import java.util.ArrayList;
import java.util.List;
import org.eclipse.lsp4j.Position;
import ai.vespa.schemals.common.ClientLogger;
import ai.vespa.schemals.parser.Token;
import ai.vespa.schemals.tree.CSTUtils;
import ai.vespa.schemals.tree.SchemaNode;
/*
* Class to view a document as a list of tokens.
* Contrary to usual standards, this will construct a list of tokens *after* parsing is done.
* This is because we can exploit CongoCC to avoid dealing with complex lexing logic.
*
* Mainly used for completion.
*
* @author mangern
* */
public class SchemaDocumentLexer {
private SchemaNode CST;
private List tokens = new ArrayList<>();
public void setCST(SchemaNode CST) {
this.CST = CST;
tokens.clear();
collectAllTokens(CST);
}
public void dumpTokens(ClientLogger logger) {
for (var node : tokens) {
Position start = node.getRange().getStart();
Position end = node.getRange().getEnd();
logger.info(
node.getDirtyType().toString() +
(node.getIsDirty() ? " [DIRTY]" : "") +
", (" + start.getLine() + ", " + start.getCharacter() + ") - (" + end.getLine() + ", " + end.getCharacter() + ")");
}
}
public SchemaNode tokenAtOrBeforePosition(Position pos, boolean skipNL) {
int index = indexOfPosition(pos, skipNL);
if (index == -1)return null;
//if (pos.equals(tokens.get(index).range().getStart())) index--;
//if (index == -1)return null;
return tokens.get(index);
}
/*
* Finds the sequence of token types supplied by 'pattern' by searching backwards
* up to 'allowSkip' places before the supplied position
* Returns a reference to the LexicalToken at the position if found
* null otherwise
*
* TODO: The ideal pattern whould be some kind of regular expression
* */
public SchemaNode matchBackwards(Position pos, int allowSkip, boolean allowDirty, Token.TokenType... pattern) {
int index = indexOfPosition(pos, false);
if (index == -1)return null;
int skipped = 0;
for (int patternStart = index - pattern.length + 1; patternStart >= 0 && skipped <= allowSkip; patternStart--, skipped++) {
boolean matched = true;
for (int i = 0; i < pattern.length; i++) {
if (pattern[i] != tokens.get(patternStart + i).getDirtyType()) {
matched = false;
}
if (tokens.get(patternStart + i).getIsDirty() && !allowDirty) {
matched = false;
}
}
if (matched) return tokens.get(patternStart);
}
return null;
}
public SchemaNode matchBackwardsOnLine(Position pos, boolean allowDirty, Token.TokenType... pattern) {
int index = indexOfPosition(pos, false);
if (index == -1)return null;
for (int patternStart = index - pattern.length + 1; patternStart >= 0; patternStart--) {
boolean matched = true;
if (tokens.get(patternStart).getRange().getStart().getLine() != pos.getLine()) break;
for (int i = 0; i < pattern.length; i++) {
if (pattern[i] != tokens.get(patternStart + i).getDirtyType()) {
matched = false;
}
if (tokens.get(patternStart + i).getIsDirty() && !allowDirty) {
matched = false;
}
}
if (matched) return tokens.get(patternStart);
}
return null;
}
/*
* Returns the index of the last token at or before the supplied position
* -1 if no such token exists
* */
private int indexOfPosition(Position pos, boolean skipNL) {
int lastIndex = -1;
for (int i = 0; i < tokens.size(); i++) {
if (skipNL && tokens.get(i).getDirtyType() == Token.TokenType.NL) continue;
if (CSTUtils.positionLT(pos, tokens.get(i).getRange().getStart())) break;
lastIndex = i;
}
return lastIndex;
}
private void collectAllTokens(SchemaNode node) {
if (node == null)return;
if (node.getDirtyType() != null) {
tokens.add(node);
}
for (SchemaNode child : node) {
collectAllTokens(child);
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy