All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.unlaxer.Token Maven / Gradle / Ivy

package org.unlaxer;

import java.io.Serializable;
import java.util.ArrayDeque;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Deque;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.function.Predicate;
import java.util.function.UnaryOperator;
import java.util.stream.Collectors;
import java.util.stream.Stream;

import org.unlaxer.ParserHierarchy.NameKind;
import org.unlaxer.listener.OutputLevel;
import org.unlaxer.parser.Parser;
import org.unlaxer.reducer.TagBasedReducer.NodeKind;
import org.unlaxer.util.FactoryBoundCache;
import org.unlaxer.util.NullSafetyConcurrentHashMap;

public class Token implements Serializable{
	
	private static final long serialVersionUID = -2232289508694932061L;

	static final FactoryBoundCache empties = 
			new FactoryBoundCache<>(RangedString::new);
	
	static final FactoryBoundCache displayString = 
			new FactoryBoundCache<>(
					token->TokenPrinter.get(token,0,OutputLevel.detail,false));

	
	
	public final Optional tokenString;
	public Parser parser;
	public final Range tokenRange;
	
	public Optional parent;
	private final List originalChildren;
	//TODO make private and rename astNodeChildren
	public  final List filteredChildren; // astNodeChildren
	
	private Map extraObjectByName = new NullSafetyConcurrentHashMap<>();
	private Map relatedTokenByName = new NullSafetyConcurrentHashMap<>();

	public enum ChildrenKind{
		original,
		astNodes
	}
	
	public final TokenKind tokenKind;
	
	
	public Token(TokenKind tokenKind , RangedString token, Parser parser) {
		this(tokenKind , token , parser , new ArrayList<>());
	}
	
	public Token(TokenKind tokenKind , List tokens , Parser parser , int position) {
		this(tokenKind , 
			createRangedString(tokens , position),
			parser,
			tokens);
	}
	
	// TODO too specialized...?
//	Predicate AST_NODES = token -> token.parser.hasTag(NodeKind.node.getTag()); <-こちらだと動かない。そもそもTagなしの状態もありってことかな?
  Predicate AST_NODES = token -> false == token.parser.hasTag(NodeKind.notNode.getTag());

	
	public Token(TokenKind tokenKind , RangedString token, Parser parser , List children) {
		super();
		this.tokenKind = tokenKind;
		this.tokenString = token.token;
		this.tokenRange = token.range;
		this.parser = parser;
		this.originalChildren = children;
		parent= Optional.empty();
		children.stream().forEach(child->{
			child.parent = Optional.of(this);
//			child.parser.setParent(parser);
		});
		this.filteredChildren = children.stream()
			.filter(AST_NODES)
			.collect(Collectors.toList());
	}
	
	public Token setParent(Token parentToken) {
		parent = Optional.ofNullable(parentToken);
		return this;
	}

	public Token setParent(Optional parentToken) {
		parent = parentToken;
		return this;
	}

	
	public static Token empty(TokenKind tokenKind , int position , Parser parser){
		return new Token(tokenKind , empties.get(position),parser);
	}
	
	public Optional getToken() {
		return tokenString;
	}
	
	public Range getTokenRange() {
		return tokenRange;
	}
	
	public RangedString getRangedString(){
		return new RangedString(tokenRange , tokenString);
	}
	
	public Parser getParser(){
		return parser;
	}
	
  public  T  getParser(Class parserClass) {
    return parserClass.cast(parser);
  }
  
    public  TypedToken typed(Class parserClassOrInterface){
    	if(parserClassOrInterface.isInterface()) {
    		return typedWithInterface(parserClassOrInterface);
    	}
    	return new TypedToken(this, Parser.get(parserClassOrInterface)).setParent(parent);
    }
    
    public  TypedToken typed(T parser){
    	return new TypedToken(this, parser).setParent(parent);
    }
    
    public  TypedToken typedWithInterface(Class parserInterface){
    	if(false == parserInterface.isInterface()) {
    		throw new IllegalArgumentException();
    	}
    	return new TypedToken(this, parserInterface.cast(parser)).setParent(parent);
    }


	public static RangedString createRangedString(List tokens, int position){
		
		if(tokens.isEmpty()){
			return new RangedString(position);
		}
		
		Optional token = Optional.of(
			tokens.stream()
				.map(Token::getToken)
				.filter(Optional::isPresent)
				.map(Optional::get)
				.collect(Collectors.joining()));
		
		int startIndex = tokens.get(0).tokenRange.startIndexInclusive;
		int endIndex = tokens.get(tokens.size()-1).tokenRange.endIndexExclusive;
		return new RangedString(new Range(startIndex, endIndex), token);
	}
	
	public List flatten(){
		return flatten(ScanDirection.Depth ,ChildrenKind.astNodes);
	}
	
	public List flatten(ScanDirection breadthOrDepth){
		return flatten(breadthOrDepth , ChildrenKind.astNodes);
	}
	
	public List flatten(ScanDirection breadthOrDepth , ChildrenKind childrenKind){
		return breadthOrDepth == ScanDirection.Depth ?
				flattenDepth(childrenKind) : flattenBreadth(childrenKind);
	}
	
	public List flattenDepth(ChildrenKind childrenKind){
		List list = new ArrayList();
		list.add(this);
		for(Token child :children(childrenKind)){
			list.addAll(child.flattenDepth(childrenKind));
		}
		return list;
	}
	
	public List flattenBreadth(ChildrenKind childrenKind){
		List list = new ArrayList();
		Deque deque = new ArrayDeque();
		deque.add(this);
		while (false == deque.isEmpty()) {
			Token poll = deque.poll();
			list.add(poll);
			if(false ==poll.children(childrenKind).isEmpty()) {
				deque.addAll(poll.children(childrenKind));
			}
		}
		return list;
	}

	
	public enum ScanDirection{
		Breadth,
		Depth
	}
	
	@Override
	public String toString() {
		return displayString.get(this);
	}
	
	public boolean isTerminalSymbol(){
		return parser.forTerminalSymbol();
	}

	public TokenKind getTokenKind() {
		return tokenKind;
	}
	public Token replace(Parser replace) {
		this.parser = replace;
		return this;
	}
	
	public Token newWithReplace(Parser replace) {
	  return new Token(tokenKind, originalChildren, replace ,tokenRange.startIndexInclusive )
			  .setParent(parent);
	}
	
	public 

TypedToken

newWithReplaceTyped(P replace) { return new Token(tokenKind, originalChildren, replace ,tokenRange.startIndexInclusive ).typed(replace) .setParent(parent); } public

TypedToken

newWithReplacedParserConstructRangedStringTyped(P replace){ return newWithReplacedParserConstructRangedStringTyped(replace , ChildrenKind.astNodes) .setParent(parent); } public Token newWithReplacedParserConstructRangedString(Parser replace){ return newWithReplacedParserConstructRangedString(replace , ChildrenKind.astNodes); } public Token newWithReplacedParserConstructRangedString(Parser replace , ChildrenKind childrenKind){ if(false == children(childrenKind).isEmpty()){ throw new IllegalArgumentException("not support collected token"); } return new Token(tokenKind,new RangedString(tokenRange, tokenString),replace).setParent(parent); } public

TypedToken

newWithReplacedParserConstructRangedStringTyped(P replace , ChildrenKind childrenKind){ if(false == children(childrenKind).isEmpty()){ throw new IllegalArgumentException("not support collected token"); } return new Token(tokenKind,new RangedString(tokenRange, tokenString),replace) .typed(replace).setParent(parent); } List children(ChildrenKind kind){ return kind == ChildrenKind.astNodes ? filteredChildren : originalChildren; } public Token newCreatesOf(List newChildrens) { Token newToken = new Token(tokenKind , newChildrens , parser , tokenRange.startIndexInclusive) .setParent(parent); return newToken; } public Token newCreatesOf(Token... newChildrens) { return newCreatesOf(Arrays.asList(newChildrens)); } @SuppressWarnings("unchecked") public Token newCreatesOf(Predicate... filterForChildrens) { List newChildren = Stream.of(filterForChildrens) .flatMap(this::getChildren) .collect(Collectors.toList()); return newCreatesOf(newChildren); } public Token newCreatesOf(TokenEffecterWithMatcher... tokenEffecterWithMatchers) { return newCreatesOf(ChildrenKind.astNodes, tokenEffecterWithMatchers); } public Token newCreatesOf(ChildrenKind kind , TokenEffecterWithMatcher... tokenEffecterWithMatchers) { List newChildren = children(kind).stream() .map(token->{ for (TokenEffecterWithMatcher tokenEffecterWithMatcher : tokenEffecterWithMatchers) { if(tokenEffecterWithMatcher.target.test(token)) { return tokenEffecterWithMatcher.effector.apply(token); } } return token; }) .collect(Collectors.toList()); return newCreatesOf(newChildren); } public Token getDirectAncestor(Predicate predicates){ return getDirectAncestorAsOptional(predicates).orElseThrow(); } public Optional getDirectAncestorAsOptional(Predicate predicates){ Token current = this; while(true) { if(current.parent.isEmpty()) { return Optional.empty(); } Token parentToken = current.parent.get(); if(predicates.test(parentToken)) { return Optional.of(parentToken); } current = parentToken; } } public Token getAncestor(Predicate predicates){ return getAncestorAsOptional(predicates).orElseThrow(); } public Optional getAncestorAsOptional(Predicate predicates){ int level=0; Token current = this; while(true) { if(current.parent.isEmpty()) { return Optional.empty(); } Token parentToken = current.parent.get(); if(predicates.test(parentToken)) { return Optional.of(parentToken); } if(level>0) { for(Token child : parentToken.originalChildren) { if(predicates.test(child)) { return Optional.of(child); } } } current = parentToken; level++; } } //FIXME! 現在flattenしてから探しているものをinterface化する public interface AbstractDescendantFinder{ } public Token getChild(Predicate predicates) { return getChild(predicates , ChildrenKind.astNodes); } public Token getChild(Predicate predicates , ChildrenKind childrenKind) { return children(childrenKind).stream().filter(predicates).findFirst().orElseThrow(); } public int getChildIndex(Predicate predicates) { return getChildIndex(ChildrenKind.astNodes, predicates); } public int getChildIndex(ChildrenKind childrenKind, Predicate predicates) { int index=0; for (Token token : children(childrenKind)) { if(predicates.test(token)) { return index; } index++; } throw new IllegalArgumentException("predicates is not match"); } public Token getChildWithParser(Predicate predicatesWithTokensParser) { return getChildWithParser(predicatesWithTokensParser,ChildrenKind.astNodes); } public Token getChildWithParser(Predicate predicatesWithTokensParser , ChildrenKind childrenKind) { return children(childrenKind).stream().filter(token-> predicatesWithTokensParser.test(token.parser)).findFirst().orElseThrow(); } public int getChildIndexWithParser(Predicate predicatesWithTokensParser) { return getChildIndexWithParser(ChildrenKind.astNodes, predicatesWithTokensParser); } public int getChildIndexWithParser(ChildrenKind childrenKind, Predicate predicatesWithTokensParser) { int index=0; for (Token token : children(childrenKind)) { if(predicatesWithTokensParser.test(token.parser)) { return index; } index++; } throw new IllegalArgumentException("predicates is not match"); } public Token getChildWithParser(Class parserClass) { return getChildWithParser(parser -> parser.getClass() == parserClass); } public

TypedToken

getChildWithParserTyped(Class

parserClass) { return getChildWithParser(parser -> parser.getClass() == parserClass).typed(parserClass); } public int getChildIndexWithParser(Class parserClass) { return getChildIndexWithParser(ChildrenKind.astNodes, parserClass); } public int getChildIndexWithParser(ChildrenKind childrenKind, Class parserClass) { return getChildIndexWithParser(childrenKind , parser -> parser.getClass() == parserClass); } public Optional getChildAsOptional(Predicate predicates ) { return getChildAsOptional(predicates , ChildrenKind.astNodes); } public Optional getChildAsOptional(Predicate predicates ,ChildrenKind childrenKind) { return children(childrenKind).stream().filter(predicates).findFirst(); } public Optional getChildWithParserAsOptional(Predicate predicatesWithTokensParser){ return getChildWithParserAsOptional(predicatesWithTokensParser , ChildrenKind.astNodes); } public Optional getChildWithParserAsOptional(Predicate predicatesWithTokensParser, ChildrenKind childrenKind) { return children(childrenKind).stream().filter(token-> predicatesWithTokensParser.test(token.parser)).findFirst(); } public Optional getChildWithParserAsOptional(Class parserClass) { return getChildWithParserAsOptional(parser -> parser.getClass() == parserClass); } public

Optional> getChildWithParserAsOptionalTyped(Class

parserClass) { return getChildWithParserAsOptional(parser -> parser.getClass() == parserClass).map(token->token.typed(parserClass)); } public Stream getChildren(Predicate predicates) { return getChildren(predicates , ChildrenKind.astNodes); } public Stream getChildren(Predicate predicates , ChildrenKind childrenKind) { return children(childrenKind).stream().filter(predicates); } public Stream getChildrenWithParser(Predicate predicatesWithTokensParser){ return getChildrenWithParser(predicatesWithTokensParser , ChildrenKind.astNodes); } public Stream getChildrenWithParser(Predicate predicatesWithTokensParser, ChildrenKind childrenKind) { return children(childrenKind).stream().filter(token-> predicatesWithTokensParser.test(token.parser)); } public Stream getChildrenWithParser(Class parserClass) { return getChildrenWithParser(parser -> parser.getClass() == parserClass); } public

Stream> getChildrenWithParserTyped(Class

parserClass) { return getChildrenWithParser(parser -> parser.getClass() == parserClass).map(token->token.typed(parserClass)); } public List getChildrenAsList(Predicate predicates) { return getChildren(predicates).collect(Collectors.toList()); } public List getChildrenWithParserAsList(Predicate predicatesWithTokensParser) { return getChildrenWithParser(predicatesWithTokensParser).collect(Collectors.toList()); } public List getChildrenWithParserAsList(Class parserClass) { return getChildrenWithParserAsList(parser -> parser.getClass() == parserClass); } public

List> getChildrenWithParserAsListTyped(Class

parserClass) { return getChildrenWithParserTyped(parserClass).collect(Collectors.toList()); } public Token getChildFromOriginal(int index) { return children(ChildrenKind.original).get(index); } public Token getChildFromAstNodes(int index) { return filteredChildren.get(index); } // public Token getChild(Predicate predicates) { // return getChild(predicates , ChildrenKind.astNodes); // } // // public Token getChild(Predicate predicates , ChildrenKind childrenKind) { // return children(childrenKind).stream().filter(predicates).findFirst().orElseThrow(); // } // // public int getChildIndex(Predicate predicates) { // return getChildIndex(ChildrenKind.astNodes, predicates); // } // // public int getChildIndex(ChildrenKind childrenKind, Predicate predicates) { // // int index=0; // for (Token token : children(childrenKind)) { // if(predicates.test(token)) { // return index; // } // index++; // } // throw new IllegalArgumentException("predicates is not match"); // } // // public Token getChildWithParser(Predicate predicatesWithTokensParser) { // return getChildWithParser(predicatesWithTokensParser,ChildrenKind.astNodes); // } // // public Token getChildWithParser(Predicate predicatesWithTokensParser , ChildrenKind childrenKind) { // return children(childrenKind).stream().filter(token-> predicatesWithTokensParser.test(token.parser)).findFirst().orElseThrow(); // } // // public int getChildIndexWithParser(Predicate predicatesWithTokensParser) { // return getChildIndexWithParser(ChildrenKind.astNodes, predicatesWithTokensParser); // } // // public int getChildIndexWithParser(ChildrenKind childrenKind, Predicate predicatesWithTokensParser) { // // int index=0; // for (Token token : children(childrenKind)) { // if(predicatesWithTokensParser.test(token.parser)) { // return index; // } // index++; // } // throw new IllegalArgumentException("predicates is not match"); // } // // // // public Token getDescendantWithParser(Class parserClass) { // return getDescendantWithParser(parser -> parser.getClass() == parserClass); // } // // public int getDescendantIndexWithParser(Class parserClass) { // return getChildIndexWithParser(ChildrenKind.astNodes, parserClass); // } // // public int getDescendantIndexWithParser(ChildrenKind childrenKind, Class parserClass) { // // return getChildIndexWithParser(childrenKind , parser -> parser.getClass() == parserClass); // } // // public Optional getDescendantAsOptional(Predicate predicates ) { // return getChildAsOptional(predicates , ChildrenKind.astNodes); // } // public Optional getDescendantAsOptional(Predicate predicates ,ChildrenKind childrenKind) { // return children(childrenKind).stream().filter(predicates).findFirst(); // } // // public Optional getChildWithParserAsOptional(Predicate predicatesWithTokensParser){ // return getChildWithParserAsOptional(predicatesWithTokensParser , ChildrenKind.astNodes); // } // public Optional getChildWithParserAsOptional(Predicate predicatesWithTokensParser, // ChildrenKind childrenKind) { // return children(childrenKind).stream().filter(token-> predicatesWithTokensParser.test(token.parser)).findFirst(); // } // // public Optional getChildWithParserAsOptional(Class parserClass) { // return getChildWithParserAsOptional(parser -> parser.getClass() == parserClass); // } // // public Stream getChildren(Predicate predicates) { // return getChildren(predicates , ChildrenKind.astNodes); // } // public Stream getChildren(Predicate predicates , ChildrenKind childrenKind) { // return children(childrenKind).stream().filter(predicates); // } // // public Stream getChildrenWithParser(Predicate predicatesWithTokensParser){ // return getChildrenWithParser(predicatesWithTokensParser , ChildrenKind.astNodes); // } // public Stream getChildrenWithParser(Predicate predicatesWithTokensParser, // ChildrenKind childrenKind) { // return children(childrenKind).stream().filter(token-> predicatesWithTokensParser.test(token.parser)); // } // // public Stream getChildrenWithParser(Class parserClass) { // return getChildrenWithParser(parser -> parser.getClass() == parserClass); // } // // public List getChildrenAsList(Predicate predicates) { // return getChildren(predicates).collect(Collectors.toList()); // } // // public List getChildrenWithParserAsList(Predicate predicatesWithTokensParser) { // return getChildrenWithParser(predicatesWithTokensParser).collect(Collectors.toList()); // } // // public List getChildrenWithParserAsList(Class parserClass) { // return getChildrenWithParserAsList(parser -> parser.getClass() == parserClass); // } public List getOriginalChildren() { return originalChildren; } public List getAstNodeChildren() { return filteredChildren; } public Token addChildren(Token...tokens) { for (Token token : tokens) { originalChildren.add(token); if(AST_NODES.test(token)) { filteredChildren.add(token); } } return this; } @SuppressWarnings("unchecked") public Optional getExtraObject(Name name) { return Optional.ofNullable( (T)extraObjectByName.get(name)); } public void putExtraObject(Name name , Object object) { extraObjectByName.put(name , object); } public boolean removeExtraObject(Name name) { var preset = extraObjectByName.remove(name); return preset != null ; } public Optional getRelatedToken(Name name) { return Optional.ofNullable( relatedTokenByName.get(name)); } public void putRelatedToken(Name name , Token relatedToken) { relatedTokenByName.put(name , relatedToken); } public Optional removeRelatedToken(Name name) { return Optional.ofNullable(relatedTokenByName.remove(name)); } public String getPath() { return getPath(parser.getName(NameKind.computedName).getSimpleName()); } String getPath(String path) { if(parent.isEmpty()) { return "/"+path; } return parent.get().getPath(parent.get().parser.getName(NameKind.computedName).getSimpleName()+"/" + path); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy