org.firebirdsql.jdbc.escape.FBEscapedParser Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of jaybird Show documentation
Show all versions of jaybird Show documentation
JDBC Driver for the Firebird RDBMS
The newest version!
/*
* Firebird Open Source JDBC Driver
*
* Distributable under LGPL license.
* You may obtain a copy of the License at http://www.gnu.org/copyleft/lgpl.html
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* LGPL License for more details.
*
* This file was created by members of the firebird development team.
* All individual contributions remain the Copyright (C) of those
* individuals. Contributors to this file are either listed here or
* can be obtained from a source control history command.
*
* All rights reserved.
*/
package org.firebirdsql.jdbc.escape;
import org.firebirdsql.jdbc.FBProcedureCall;
import org.firebirdsql.util.InternalApi;
import java.sql.SQLException;
import java.text.BreakIterator;
import java.util.ArrayDeque;
import java.util.Locale;
import java.util.regex.Pattern;
/**
 * The class {@code FBEscapedParser} parses the SQL and converts escaped syntax to native form.
 * <p>
 * The SQL text is scanned character by character with a small state machine ({@code ParserState}) that tracks
 * string literals, Q-literals, line comments and block comments, so that curly braces inside those constructs are
 * not mistaken for JDBC escapes. The text of each escape is collected in its own buffer (escapes can be nested)
 * and converted when the closing curly brace is found.
 * </p>
 *
 * @author Roman Rokytskyy
 * @author Mark Rotteveel
 */
@InternalApi
public final class FBEscapedParser {

    /*
     Stored procedure calls support both following syntax:
        {call procedure_name[(arg1, arg2, ...)]}
     or
        {?= call procedure_name[(arg1, arg2, ...)]}
     */
    private static final String ESCAPE_CALL_KEYWORD = "call";
    private static final String ESCAPE_CALL_KEYWORD3 = "?";
    private static final String ESCAPE_DATE_KEYWORD = "d";
    private static final String ESCAPE_TIME_KEYWORD = "t";
    private static final String ESCAPE_TIMESTAMP_KEYWORD = "ts";
    private static final String ESCAPE_FUNCTION_KEYWORD = "fn";
    private static final String ESCAPE_ESCAPE_KEYWORD = "escape";
    private static final String ESCAPE_OUTERJOIN_KEYWORD = "oj";
    private static final String ESCAPE_LIMIT_KEYWORD = "limit";

    /**
     * Regular expression to check for existence of JDBC escapes, is used to
     * stop processing the entire SQL statement if it does not contain any of
     * the escape introducers.
     */
    private static final Pattern CHECK_ESCAPE_PATTERN = Pattern.compile(
            "\\{(?:(?:\\?\\s*=\\s*)?call|d|ts?|escape|fn|oj|limit)\\s",
            Pattern.CASE_INSENSITIVE);

    private static final String LIMIT_OFFSET_CLAUSE = " offset ";

    private FBEscapedParser() {
        // No instances
    }

    /**
     * Check if the target SQL contains at least one of the escaped syntax commands. This method performs a simple
     * regex match, so it may report that SQL contains escaped syntax when the <code>"{"</code> is followed by the
     * escaped syntax command in regular string constants that are passed as parameters. In this case
     * {@link #parse(String)} will perform complete SQL parsing.
     *
     * @param sql
     *         to test
     * @return {@code true} if the {@code sql} is suspected to contain escaped syntax.
     */
    private static boolean checkForEscapes(String sql) {
        return CHECK_ESCAPE_PATTERN.matcher(sql).find();
    }

    /**
     * Converts escaped parts in {@code sql} to native representation.
     * <p>
     * This method simply delegates to {@link #parse(String)}.
     * </p>
     *
     * @param sql
     *         to parse
     * @return native form of the {@code sql}.
     * @throws SQLException
     *         if the escaped syntax could not be parsed or converted
     */
    public static String toNativeSql(String sql) throws SQLException {
        return parse(sql);
    }

    /**
     * Converts escaped parts in {@code sql} to native representation.
     * <p>
     * If the quick regular expression check finds no escape introducer, {@code sql} is returned unchanged (same
     * instance). Otherwise the statement is scanned completely; in that case leading whitespace is dropped from
     * the result.
     * </p>
     *
     * @param sql
     *         to parse
     * @return native form of the {@code sql}.
     * @throws SQLException
     *         if the curly braces are unbalanced, an escape starts with an unexpected character or keyword,
     *         a Q-literal is not terminated, or conversion of an escape fails
     */
    @SuppressWarnings("java:S127")
    public static String parse(final String sql) throws SQLException {
        if (!checkForEscapes(sql)) {
            return sql;
        }

        ParserState state = ParserState.INITIAL_STATE;
        // Note initialising to 8 as that is the minimum size in Oracle Java, and we (usually) need less than the
        // default of 16
        final var bufferStack = new ArrayDeque<StringBuilder>(8);
        final int sqlLength = sql.length();
        var buffer = new StringBuilder(sqlLength);

        for (int i = 0; i < sqlLength; i++) {
            char currentChar = sql.charAt(i);
            state = state.nextState(currentChar);
            switch (state) {
            case INITIAL_STATE -> {
                // Ignore leading whitespace
            }
            case NORMAL_STATE, LITERAL_STATE,
                    START_LINE_COMMENT, LINE_COMMENT, START_BLOCK_COMMENT, BLOCK_COMMENT, END_BLOCK_COMMENT,
                    POSSIBLE_Q_LITERAL_ENTER -> buffer.append(currentChar);
            case ESCAPE_ENTER_STATE -> {
                // Park the text collected so far; the escape content gets a buffer of its own
                bufferStack.push(buffer);
                buffer = new StringBuilder();
            }
            case ESCAPE_EXIT_STATE -> {
                if (bufferStack.isEmpty()) {
                    throw new FBSQLParseException("Unbalanced JDBC escape, too many '}'");
                }
                // Convert the finished escape and append the result to the enclosing text
                String escapeText = buffer.toString();
                buffer = bufferStack.pop();
                escapeToNative(buffer, escapeText);
            }
            case Q_LITERAL_START -> {
                // currentChar is the quote following q/Q; the next character selects the alternate end character
                buffer.append(currentChar);
                if (++i >= sqlLength) {
                    throw new FBSQLParseException("Unexpected end of string at parser state " + state);
                }
                final char alternateStartChar = sql.charAt(i);
                buffer.append(alternateStartChar);
                final char alternateEndChar = qLiteralEndChar(alternateStartChar);
                // Copy the literal verbatim until the end character directly followed by a quote; the quote
                // itself is consumed by the next iteration of the outer loop (state Q_LITERAL_END)
                for (i++; i < sqlLength; i++) {
                    currentChar = sql.charAt(i);
                    buffer.append(currentChar);
                    if (currentChar == alternateEndChar && i + 1 < sqlLength && sql.charAt(i + 1) == '\'') {
                        state = ParserState.Q_LITERAL_END;
                        break;
                    }
                }
                if (i == sqlLength) {
                    throw new FBSQLParseException("Unexpected end of string at parser state " + state);
                }
            }
            default -> throw new FBSQLParseException("Unexpected parser state " + state);
            }
        }

        if (!bufferStack.isEmpty()) {
            throw new FBSQLParseException("Unbalanced JDBC escape, too many '{'");
        }
        return buffer.toString();
    }

    /**
     * Determines the character that ends a Q-literal started with {@code startChar}.
     *
     * @param startChar
     *         character directly following the opening quote of the Q-literal
     * @return the matching closing bracket for {@code (}, <code>{</code>, {@code [} and {@code <}, otherwise
     * {@code startChar} itself
     */
    private static char qLiteralEndChar(char startChar) {
        return switch (startChar) {
            case '(' -> ')';
            case '{' -> '}';
            case '[' -> ']';
            case '<' -> '>';
            default -> startChar;
        };
    }

    /**
     * Splits the text of an escape into its keyword (the first word as determined by a word
     * {@link BreakIterator}) and the remaining payload with surrounding whitespace removed.
     *
     * @param escaped
     *         the part of escaped SQL between the '{' and '}'
     * @param keyword
     *         empty StringBuilder that receives the keyword
     * @param payload
     *         empty StringBuilder that receives the payload
     */
    private static void processEscaped(final String escaped, final StringBuilder keyword, final StringBuilder payload) {
        assert keyword.isEmpty() && payload.isEmpty() : "StringBuilders keyword and payload should be empty";

        // Extract the keyword from the escaped syntax.
        final BreakIterator iterator = BreakIterator.getWordInstance();
        iterator.setText(escaped);
        final int keyStart = iterator.first();
        final int keyEnd = iterator.next();
        keyword.append(escaped, keyStart, keyEnd);

        int payloadStart = keyEnd;
        // Remove whitespace before payload
        while (payloadStart < escaped.length() - 1 && escaped.charAt(payloadStart) <= ' ') {
            payloadStart++;
        }

        int payloadEnd = escaped.length();
        // Remove whitespace after payload
        while (payloadEnd > payloadStart && escaped.charAt(payloadEnd - 1) <= ' ') {
            payloadEnd--;
        }

        payload.append(escaped, payloadStart, payloadEnd);
    }

    /**
     * This method checks the passed parameter to conform the escaped syntax,
     * checks for the unknown keywords and re-formats result according to the
     * Firebird SQL syntax.
     *
     * @param target
     *         Target StringBuilder to append to.
     * @param escaped
     *         the part of escaped SQL between the '{' and '}'.
     * @throws SQLException
     *         if the keyword is unknown or the conversion of the escape fails
     */
    private static void escapeToNative(final StringBuilder target, final String escaped) throws SQLException {
        final StringBuilder keyword = new StringBuilder();
        final StringBuilder payload = new StringBuilder(Math.max(16, escaped.length()));

        processEscaped(escaped, keyword, payload);

        //Handle keywords.
        final String keywordStr = keyword.toString().toLowerCase(Locale.ROOT);
        // NOTE: We assume here that all KEYWORD constants are lowercase!
        switch (keywordStr) {
        // TODO Should we call convertProcedureCall? It leads to inefficient double parsing
        case ESCAPE_CALL_KEYWORD -> convertProcedureCall(target, "{" + keyword + ' ' + payload + '}');
        // TODO Should we call convertProcedureCall? It leads to inefficient double parsing
        case ESCAPE_CALL_KEYWORD3 -> convertProcedureCall(target, "{" + ESCAPE_CALL_KEYWORD3 + payload + '}');
        case ESCAPE_DATE_KEYWORD -> toDateString(target, payload);
        case ESCAPE_ESCAPE_KEYWORD -> convertEscapeString(target, payload);
        case ESCAPE_FUNCTION_KEYWORD -> convertEscapedFunction(target, payload);
        case ESCAPE_OUTERJOIN_KEYWORD -> convertOuterJoin(target, payload);
        case ESCAPE_TIME_KEYWORD -> toTimeString(target, payload);
        case ESCAPE_TIMESTAMP_KEYWORD -> toTimestampString(target, payload);
        case ESCAPE_LIMIT_KEYWORD -> convertLimitString(target, payload);
        default -> throw new FBSQLParseException("Unknown keyword " + keywordStr + " for escaped syntax.");
        }
    }

    /**
     * This method converts the 'yyyy-mm-dd' date format into the Firebird
     * understandable format.
     *
     * @param target
     *         Target StringBuilder to append to.
     * @param dateStr
     *         the date in the 'yyyy-mm-dd' format.
     */
    private static void toDateString(final StringBuilder target, final CharSequence dateStr) {
        // use shorthand date cast (using just the string will not work in all contexts)
        target.append("DATE ").append(dateStr);
    }

    /**
     * This method converts the 'hh:mm:ss' time format into the Firebird
     * understandable format.
     *
     * @param target
     *         Target StringBuilder to append to.
     * @param timeStr
     *         the time in the 'hh:mm:ss' format.
     */
    private static void toTimeString(final StringBuilder target, final CharSequence timeStr) {
        // use shorthand time cast (using just the string will not work in all contexts)
        target.append("TIME ").append(timeStr);
    }

    /**
     * This method converts the 'yyyy-mm-dd hh:mm:ss' timestamp format into the
     * Firebird understandable format.
     *
     * @param target
     *         Target StringBuilder to append to.
     * @param timestampStr
     *         the timestamp in the 'yyyy-mm-dd hh:mm:ss' format.
     */
    private static void toTimestampString(final StringBuilder target, final CharSequence timestampStr) {
        // use shorthand timestamp cast (using just the string will not work in all contexts)
        target.append("TIMESTAMP ").append(timestampStr);
    }

    /**
     * Converts the escaped procedure call syntax into the native procedure call.
     *
     * @param target
     *         Target StringBuilder to append native procedure call to.
     * @param procedureCall
     *         complete call escape including the curly braces, i.e. {@code {call proc_name(...)}} or
     *         {@code {?= call proc_name(...)}}
     * @throws SQLException
     *         if the call could not be parsed or its parameters are invalid
     */
    private static void convertProcedureCall(final StringBuilder target, final String procedureCall) throws SQLException {
        FBEscapedCallParser tempParser = new FBEscapedCallParser();
        FBProcedureCall call = tempParser.parseCall(procedureCall);
        call.checkParameters();
        target.append(call.getSQL(false));
    }

    /**
     * This method converts the escaped outer join call syntax into the native
     * outer join. Actually, we do not change anything here, since Firebird's
     * syntax is the same.
     *
     * @param target
     *         Target StringBuilder to append to.
     * @param outerJoin
     *         Outer join text
     */
    private static void convertOuterJoin(final StringBuilder target, final CharSequence outerJoin) {
        target.append(outerJoin);
    }

    /**
     * Convert the {@code "{escape '...'}"} call into the corresponding escape clause for Firebird.
     *
     * @param target
     *         Target StringBuilder to append to.
     * @param escapeString
     *         escape string to convert
     */
    private static void convertEscapeString(final StringBuilder target, final CharSequence escapeString) {
        target.append("ESCAPE ").append(escapeString);
    }

    /**
     * Convert the {@code "{limit <rows> [offset <rows_offset>]}"} call into the corresponding rows clause for
     * Firebird.
     * <p>
     * NOTE: We assume that the {limit ...} escape occurs in the right place to work for a
     * {@code ROWS}
     * clause in Firebird.
     * </p>
     * <p>
     * This implementation supports a parameter for the value of &lt;rows&gt;, but not for &lt;rows_offset&gt;.
     * </p>
     *
     * @param target
     *         Target StringBuilder to append to.
     * @param limitClause
     *         Limit clause
     * @throws FBSQLParseException
     *         if the offset contains a parameter marker ({@code ?})
     */
    private static void convertLimitString(final StringBuilder target, final CharSequence limitClause)
            throws FBSQLParseException {
        final String limitEscape = limitClause.toString().toLowerCase(Locale.ROOT);
        final int offsetStart = limitEscape.indexOf(LIMIT_OFFSET_CLAUSE);
        if (offsetStart == -1) {
            target.append("ROWS ").append(limitEscape);
        } else {
            final String rows = limitEscape.substring(0, offsetStart).trim();
            final String offset = limitEscape.substring(offsetStart + LIMIT_OFFSET_CLAUSE.length()).trim();
            // The offset is emitted twice below, which cannot be expressed with a single parameter marker
            if (offset.indexOf('?') != -1) {
                throw new FBSQLParseException("Extended limit escape ({limit <rows> offset <rows_offset>}) "
                        + "does not support parameters for <rows_offset>");
            }
            target.append("ROWS ").append(offset).append(" TO ").append(offset).append("+").append(rows);
        }
    }

    /**
     * This method converts escaped function to a server function call. If
     * {@code FBEscapedFunctionHelper.convertTemplate} yields no result ({@code null}), the function call is
     * appended unchanged; we hope that all UDF are defined.
     *
     * @param target
     *         Target StringBuilder to append to.
     * @param escapedFunction
     *         escaped function call
     * @throws FBSQLParseException
     *         if something was wrong.
     */
    private static void convertEscapedFunction(final StringBuilder target, final CharSequence escapedFunction)
            throws FBSQLParseException {
        final String templateResult = FBEscapedFunctionHelper.convertTemplate(escapedFunction.toString());
        target.append(templateResult != null ? templateResult : escapedFunction);
    }

    /**
     * States of the scanner used by {@link #parse(String)}; each state decides on its successor for the next
     * input character.
     */
    private enum ParserState {
        /**
         * Initial parser state (to ignore leading whitespace)
         */
        INITIAL_STATE {
            @Override
            protected ParserState nextState(char inputChar) throws FBSQLParseException {
                return Character.isWhitespace(inputChar) ? INITIAL_STATE : NORMAL_STATE.nextState(inputChar);
            }
        },
        /**
         * Normal SQL query text state
         */
        NORMAL_STATE {
            @Override
            protected ParserState nextState(char inputChar) {
                return switch (inputChar) {
                    case '\'' -> LITERAL_STATE;
                    case '{' -> ESCAPE_ENTER_STATE;
                    case '}' -> ESCAPE_EXIT_STATE;
                    case '-' -> START_LINE_COMMENT;
                    case '/' -> START_BLOCK_COMMENT;
                    case 'q', 'Q' -> POSSIBLE_Q_LITERAL_ENTER;
                    default -> NORMAL_STATE;
                };
            }
        },
        /**
         * SQL literal text (text inside quotes)
         */
        LITERAL_STATE {
            @Override
            protected ParserState nextState(char inputChar) {
                return (inputChar == '\'') ? NORMAL_STATE : LITERAL_STATE;
            }
        },
        /**
         * Start of JDBC escape ({ character encountered).
         */
        ESCAPE_ENTER_STATE {
            @Override
            protected ParserState nextState(char inputChar) throws FBSQLParseException {
                return switch (inputChar) {
                    // '?' starts {?= call ...}; the letters are the first characters of
                    // {call ...}, {d ...}, {t ...} or {ts ...}, {escape ...}, {fn ...}, {oj ...} and {limit ...}
                    case '?', 'c', 'C', 'd', 'D', 't', 'T', 'e', 'E', 'f', 'F', 'o', 'O', 'l', 'L' -> NORMAL_STATE;
                    default -> throw new FBSQLParseException(
                            "Unexpected first character inside JDBC escape: " + inputChar);
                };
            }
        },
        /**
         * End of JDBC escape (} character encountered)
         */
        ESCAPE_EXIT_STATE {
            @Override
            protected ParserState nextState(char inputChar) throws FBSQLParseException {
                return NORMAL_STATE.nextState(inputChar);
            }
        },
        /**
         * Potential start of line comment
         */
        START_LINE_COMMENT {
            @Override
            protected ParserState nextState(char inputChar) throws FBSQLParseException {
                return (inputChar == '-') ? LINE_COMMENT : NORMAL_STATE.nextState(inputChar);
            }
        },
        /**
         * Line comment
         */
        LINE_COMMENT {
            @Override
            protected ParserState nextState(char inputChar) {
                return (inputChar == '\n') ? NORMAL_STATE : LINE_COMMENT;
            }
        },
        /**
         * Potential start of block comment
         */
        START_BLOCK_COMMENT {
            @Override
            protected ParserState nextState(char inputChar) throws FBSQLParseException {
                return (inputChar == '*') ? BLOCK_COMMENT : NORMAL_STATE.nextState(inputChar);
            }
        },
        /**
         * Block comment
         */
        BLOCK_COMMENT {
            @Override
            protected ParserState nextState(char inputChar) {
                return (inputChar == '*') ? END_BLOCK_COMMENT : BLOCK_COMMENT;
            }
        },
        /**
         * Potential block comment end
         */
        END_BLOCK_COMMENT {
            @Override
            protected ParserState nextState(char inputChar) {
                return switch (inputChar) {
                    case '/' -> NORMAL_STATE;
                    // Another asterisk can itself be the start of the comment terminator, so a comment ending
                    // in a run of asterisks followed by a slash is still closed
                    case '*' -> END_BLOCK_COMMENT;
                    default -> BLOCK_COMMENT;
                };
            }
        },
        /**
         * Potential Q-literal
         */
        POSSIBLE_Q_LITERAL_ENTER {
            @Override
            protected ParserState nextState(char inputChar) throws FBSQLParseException {
                // Not a Q-literal after all: the q/Q was ordinary text, so the current character must be
                // classified as in normal state (it may be a curly brace, comment start or another q)
                return (inputChar == '\'') ? Q_LITERAL_START : NORMAL_STATE.nextState(inputChar);
            }
        },
        /**
         * Start of Q escape, next character will be the alternate end character. Further processing needs to be done
         * separately.
         */
        Q_LITERAL_START {
            @Override
            protected ParserState nextState(char inputChar) throws FBSQLParseException {
                throw new FBSQLParseException("Q-literal handling needs to be performed separately");
            }
        },
        /**
         * End character of a Q-literal was consumed; the only valid next character is the closing quote.
         */
        Q_LITERAL_END {
            @Override
            protected ParserState nextState(char inputChar) throws FBSQLParseException {
                if (inputChar != '\'') {
                    throw new FBSQLParseException("Invalid char " + inputChar + " for state Q_LITERAL_END");
                }
                return NORMAL_STATE;
            }
        };

        /**
         * Decides on the next ParserState based on the input character.
         *
         * @param inputChar
         *         Input character
         * @return Next state
         * @throws FBSQLParseException
         *         For incorrect character for current state during parsing
         */
        protected abstract ParserState nextState(char inputChar) throws FBSQLParseException;
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy