All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.hl7.fhir.r4.fhirpath.FHIRLexer Maven / Gradle / Ivy

Go to download

Builds the hapi fhir r4. Requires hapi-fhir-base and hapi-fhir-utilities be built first and be excluded from any other poms requiring it.

The newest version!
package org.hl7.fhir.r4.fhirpath;

import org.hl7.fhir.exceptions.FHIRException;
import org.hl7.fhir.utilities.SourceLocation;
import org.hl7.fhir.utilities.Utilities;

// shared lexer for concrete syntaxes 
// - FluentPath
// - Mapping language

public class FHIRLexer {
  public class FHIRLexerException extends FHIRException {

    public FHIRLexerException() {
      super();
    }

    public FHIRLexerException(String message, Throwable cause) {
      super(message, cause);
    }

    public FHIRLexerException(String message) {
      super(message);
    }

    public FHIRLexerException(Throwable cause) {
      super(cause);
    }

  }

  private String source;
  private int cursor;
  private int currentStart;
  private String current;
  private SourceLocation currentLocation;
  private SourceLocation currentStartLocation;
  private int id;
  private String name;

  public FHIRLexer(String source, String name) throws FHIRLexerException {
    this.source = source;
    this.name = name == null ? "??" : name;
    currentLocation = new SourceLocation(1, 1);
    next();
  }

  public FHIRLexer(String source, int i) throws FHIRLexerException {
    this.source = source;
    this.cursor = i;
    currentLocation = new SourceLocation(1, 1);
    next();
  }

  public String getCurrent() {
    return current;
  }

  public SourceLocation getCurrentLocation() {
    return currentLocation;
  }

  public boolean isConstant() {
    return current != null && (current.charAt(0) == '\'' || current.charAt(0) == '"') || current.charAt(0) == '@'
        || current.charAt(0) == '%' || current.charAt(0) == '-' || current.charAt(0) == '+'
        || (current.charAt(0) >= '0' && current.charAt(0) <= '9') || current.equals("true") || current.equals("false")
        || current.equals("{}");
  }

  public boolean isFixedName() {
    return current != null && (current.charAt(0) == '`');
  }

  public boolean isStringConstant() {
    return current.charAt(0) == '\'' || current.charAt(0) == '"' || current.charAt(0) == '`';
  }

  public String take() throws FHIRLexerException {
    String s = current;
    next();
    return s;
  }

  public int takeInt() throws FHIRLexerException {
    String s = current;
    if (!Utilities.isInteger(s))
      throw error("Found " + current + " expecting an integer");
    next();
    return Integer.parseInt(s);
  }

  public boolean isToken() {
    if (Utilities.noString(current))
      return false;

    if (current.startsWith("$"))
      return true;

    if (current.equals("*") || current.equals("**"))
      return true;

    if ((current.charAt(0) >= 'A' && current.charAt(0) <= 'Z')
        || (current.charAt(0) >= 'a' && current.charAt(0) <= 'z')) {
      for (int i = 1; i < current.length(); i++)
        if (!((current.charAt(1) >= 'A' && current.charAt(1) <= 'Z')
            || (current.charAt(1) >= 'a' && current.charAt(1) <= 'z')
            || (current.charAt(1) >= '0' && current.charAt(1) <= '9')))
          return false;
      return true;
    }
    return false;
  }

  public FHIRLexerException error(String msg) {
    return error(msg, currentLocation.toString());
  }

  public FHIRLexerException error(String msg, String location) {
    return new FHIRLexerException("Error in " + name + " at " + location + ": " + msg);
  }

  public void next() throws FHIRLexerException {
    skipWhitespaceAndComments();
    current = null;
    currentStart = cursor;
    currentStartLocation = currentLocation;
    if (cursor < source.length()) {
      char ch = source.charAt(cursor);
      if (ch == '!' || ch == '>' || ch == '<' || ch == ':' || ch == '-' || ch == '=') {
        cursor++;
        if (cursor < source.length()
            && (source.charAt(cursor) == '=' || source.charAt(cursor) == '~' || source.charAt(cursor) == '-')
            || (ch == '-' && source.charAt(cursor) == '>'))
          cursor++;
        current = source.substring(currentStart, cursor);
      } else if (ch == '.') {
        cursor++;
        if (cursor < source.length() && (source.charAt(cursor) == '.'))
          cursor++;
        current = source.substring(currentStart, cursor);
      } else if (ch >= '0' && ch <= '9') {
        cursor++;
        boolean dotted = false;
        while (cursor < source.length() && ((source.charAt(cursor) >= '0' && source.charAt(cursor) <= '9')
            || (source.charAt(cursor) == '.') && !dotted)) {
          if (source.charAt(cursor) == '.')
            dotted = true;
          cursor++;
        }
        if (source.charAt(cursor - 1) == '.')
          cursor--;
        current = source.substring(currentStart, cursor);
      } else if ((ch >= 'a' && ch <= 'z') || (ch >= 'A' && ch <= 'Z')) {
        while (cursor < source.length() && ((source.charAt(cursor) >= 'A' && source.charAt(cursor) <= 'Z')
            || (source.charAt(cursor) >= 'a' && source.charAt(cursor) <= 'z')
            || (source.charAt(cursor) >= '0' && source.charAt(cursor) <= '9') || source.charAt(cursor) == '_'))
          cursor++;
        current = source.substring(currentStart, cursor);
      } else if (ch == '%') {
        cursor++;
        if (cursor < source.length() && (source.charAt(cursor) == '`')) {
          cursor++;
          while (cursor < source.length() && (source.charAt(cursor) != '`'))
            cursor++;
          cursor++;
        } else
          while (cursor < source.length() && ((source.charAt(cursor) >= 'A' && source.charAt(cursor) <= 'Z')
              || (source.charAt(cursor) >= 'a' && source.charAt(cursor) <= 'z')
              || (source.charAt(cursor) >= '0' && source.charAt(cursor) <= '9') || source.charAt(cursor) == ':'
              || source.charAt(cursor) == '-'))
            cursor++;
        current = source.substring(currentStart, cursor);
      } else if (ch == '/') {
        cursor++;
        if (cursor < source.length() && (source.charAt(cursor) == '/')) {
          // this is en error - should already have been skipped
          error("This shoudn't happen?");
        }
        current = source.substring(currentStart, cursor);
      } else if (ch == '$') {
        cursor++;
        while (cursor < source.length() && (source.charAt(cursor) >= 'a' && source.charAt(cursor) <= 'z'))
          cursor++;
        current = source.substring(currentStart, cursor);
      } else if (ch == '{') {
        cursor++;
        ch = source.charAt(cursor);
        if (ch == '}')
          cursor++;
        current = source.substring(currentStart, cursor);
      } else if (ch == '"') {
        cursor++;
        boolean escape = false;
        while (cursor < source.length() && (escape || source.charAt(cursor) != '"')) {
          if (escape)
            escape = false;
          else
            escape = (source.charAt(cursor) == '\\');
          cursor++;
        }
        if (cursor == source.length())
          throw error("Unterminated string");
        cursor++;
        current = "\"" + source.substring(currentStart + 1, cursor - 1) + "\"";
      } else if (ch == '`') {
        cursor++;
        boolean escape = false;
        while (cursor < source.length() && (escape || source.charAt(cursor) != '`')) {
          if (escape)
            escape = false;
          else
            escape = (source.charAt(cursor) == '\\');
          cursor++;
        }
        if (cursor == source.length())
          throw error("Unterminated string");
        cursor++;
        current = "`" + source.substring(currentStart + 1, cursor - 1) + "`";
      } else if (ch == '\'') {
        cursor++;
        char ech = ch;
        boolean escape = false;
        while (cursor < source.length() && (escape || source.charAt(cursor) != ech)) {
          if (escape)
            escape = false;
          else
            escape = (source.charAt(cursor) == '\\');
          cursor++;
        }
        if (cursor == source.length())
          throw error("Unterminated string");
        cursor++;
        current = source.substring(currentStart, cursor);
        if (ech == '\'')
          current = "\'" + current.substring(1, current.length() - 1) + "\'";
      } else if (ch == '`') {
        cursor++;
        boolean escape = false;
        while (cursor < source.length() && (escape || source.charAt(cursor) != '`')) {
          if (escape)
            escape = false;
          else
            escape = (source.charAt(cursor) == '\\');
          cursor++;
        }
        if (cursor == source.length())
          throw error("Unterminated string");
        cursor++;
        current = "`" + source.substring(currentStart + 1, cursor - 1) + "`";
      } else if (ch == '@') {
        int start = cursor;
        cursor++;
        while (cursor < source.length() && isDateChar(source.charAt(cursor), start))
          cursor++;
        current = source.substring(currentStart, cursor);
      } else { // if CharInSet(ch, ['.', ',', '(', ')', '=', '$']) then
        cursor++;
        current = source.substring(currentStart, cursor);
      }
    }
  }

  private void skipWhitespaceAndComments() {
    boolean last13 = false;
    boolean done = false;
    while (cursor < source.length() && !done) {
      if (cursor < source.length() - 1 && "//".equals(source.substring(cursor, cursor + 2))) {
        while (cursor < source.length() && !((source.charAt(cursor) == '\r') || source.charAt(cursor) == '\n'))
          cursor++;
      } else if (cursor < source.length() - 1 && "/*".equals(source.substring(cursor, cursor + 2))) {
        while (cursor < source.length() - 1 && !"*/".equals(source.substring(cursor, cursor + 2))) {
          last13 = currentLocation.checkChar(source.charAt(cursor), last13);
          cursor++;
        }
        if (cursor >= source.length() - 1) {
          error("Unfinished comment");
        } else {
          cursor = cursor + 2;
        }
      } else if (Character.isWhitespace(source.charAt(cursor))) {
        last13 = currentLocation.checkChar(source.charAt(cursor), last13);
        cursor++;
      } else {
        done = true;
      }
    }
  }

  private boolean isDateChar(char ch, int start) {
    int eot = source.charAt(start + 1) == 'T' ? 10 : 20;

    return ch == '-' || ch == ':' || ch == 'T' || ch == '+' || ch == 'Z' || Character.isDigit(ch)
        || (cursor - start == eot && ch == '.' && cursor < source.length() - 1
            && Character.isDigit(source.charAt(cursor + 1)));
  }

  public boolean isOp() {
    return ExpressionNode.Operation.fromCode(current) != null;
  }

  public boolean done() {
    return currentStart >= source.length();
  }

  public int nextId() {
    id++;
    return id;
  }

  public SourceLocation getCurrentStartLocation() {
    return currentStartLocation;
  }

  // special case use
  public void setCurrent(String current) {
    this.current = current;
  }

  public boolean hasComment() {
    return !done() && current.startsWith("//");
  }

  public boolean hasToken(String kw) {
    return !done() && kw.equals(current);
  }

  public boolean hasToken(String... names) {
    if (done())
      return false;
    for (String s : names)
      if (s.equals(current))
        return true;
    return false;
  }

  public void token(String kw) throws FHIRLexerException {
    if (!kw.equals(current))
      throw error("Found \"" + current + "\" expecting \"" + kw + "\"");
    next();
  }

  public String readConstant(String desc) throws FHIRLexerException {
    if (!isStringConstant())
      throw error("Found " + current + " expecting \"[" + desc + "]\"");

    return processConstant(take());
  }

  public String readFixedName(String desc) throws FHIRLexerException {
    if (!isFixedName())
      throw error("Found " + current + " expecting \"[" + desc + "]\"");

    return processFixedName(take());
  }

  public String processConstant(String s) throws FHIRLexerException {
    StringBuilder b = new StringBuilder();
    int i = 1;
    while (i < s.length() - 1) {
      char ch = s.charAt(i);
      if (ch == '\\') {
        i++;
        switch (s.charAt(i)) {
        case 't':
          b.append('\t');
          break;
        case 'r':
          b.append('\r');
          break;
        case 'n':
          b.append('\n');
          break;
        case 'f':
          b.append('\f');
          break;
        case '\'':
          b.append('\'');
          break;
        case '"':
          b.append('"');
          break;
        case '`':
          b.append('`');
          break;
        case '\\':
          b.append('\\');
          break;
        case '/':
          b.append('/');
          break;
        case 'u':
          i++;
          int uc = Integer.parseInt(s.substring(i, i + 4), 16);
          b.append(Character.toString(uc));
          i = i + 4;
          break;
        default:
          throw new FHIRLexerException("Unknown character escape \\" + s.charAt(i));
        }
      } else {
        b.append(ch);
        i++;
      }
    }
    return b.toString();
  }

  public String processFixedName(String s) throws FHIRLexerException {
    StringBuilder b = new StringBuilder();
    int i = 1;
    while (i < s.length() - 1) {
      char ch = s.charAt(i);
      if (ch == '\\') {
        i++;
        switch (s.charAt(i)) {
        case 't':
          b.append('\t');
          break;
        case 'r':
          b.append('\r');
          break;
        case 'n':
          b.append('\n');
          break;
        case 'f':
          b.append('\f');
          break;
        case '\'':
          b.append('\'');
          break;
        case '"':
          b.append('"');
          break;
        case '\\':
          b.append('\\');
          break;
        case '/':
          b.append('/');
          break;
        case 'u':
          i++;
          int uc = Integer.parseInt(s.substring(i, i + 4), 16);
          b.append(Character.toString(uc));
          i = i + 4;
          break;
        default:
          throw new FHIRLexerException("Unknown character escape \\" + s.charAt(i));
        }
      } else {
        b.append(ch);
        i++;
      }
    }
    return b.toString();
  }

  public void skipToken(String token) throws FHIRLexerException {
    if (getCurrent().equals(token))
      next();

  }

  public String takeDottedToken() throws FHIRLexerException {
    StringBuilder b = new StringBuilder();
    b.append(take());
    while (!done() && getCurrent().equals(".")) {
      b.append(take());
      b.append(take());
    }
    return b.toString();
  }

  public void skipComments() throws FHIRLexerException {
    while (!done() && hasComment())
      next();
  }

  public int getCurrentStart() {
    return currentStart;
  }

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy