![JAR search and dependency download from the Maven repository](/logo.png)
it.unibz.inf.ontop.spec.sqlparser.ApproximateSelectQueryAttributeExtractor Maven / Gradle / Ivy
The newest version!
package it.unibz.inf.ontop.spec.sqlparser;
/*
* #%L
* ontop-obdalib-core
* %%
* Copyright (C) 2009 - 2014 Free University of Bozen-Bolzano
* %%
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* #L%
*/
import com.google.common.collect.ImmutableList;
import it.unibz.inf.ontop.dbschema.*;
import it.unibz.inf.ontop.exception.InvalidQueryException;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
/**
* Used when the SQL cannot be parsed.
* The algorithm performs a crude approximate extraction of attribute names.
*
* Created by Roman Kontchakov on 09/01/2017.
*/
public class ApproximateSelectQueryAttributeExtractor {

    /** Factory used to turn each extracted column/alias string into a {@link QuotedID}. */
    private final QuotedIDFactory idfac;

    /**
     * Matches one projection item of the form {@code [qualifier.]*column [[AS] alias]}.
     * The named group {@code column} captures the last ID component and the named
     * group {@code alias} captures the optional alias; both are read in
     * {@link #getAttributes(String)}.
     */
    private static final Pattern AS = Pattern.compile(
            "(((\\w+)|(\"[^\"]+\")|(`[^`]+`)|(\\[[^]]+]))\\.)*" + // database, schema, table
            "(?<column>(\\w+)|(\"[^\"]+\")|(`[^`]+`)|(\\[[^]]+]))" + // all ID components can be unquoted or quoted in ", ` or []
            "(\\s+(AS\\s+)?" +
            "(?<alias>(\\w+)|(\"[^\"]+\")|(`[^`]+`)|(\\[[^]]+])))?", Pattern.CASE_INSENSITIVE);

    /** Matches an innermost parenthesised group, i.e. one that contains no further parentheses. */
    private static final Pattern BRACKETS = Pattern.compile("\\([^()]*\\)");

    /** Separator between projection items. */
    private static final Pattern COL_SEP = Pattern.compile(",");

    /** Matches the leading {@code SELECT [DISTINCT]} keyword(s) at the very start of the query. */
    private static final Pattern SELECT = Pattern.compile("\\A\\s*SELECT\\s+(DISTINCT\\s)?", Pattern.CASE_INSENSITIVE);

    /** Matches a whitespace-delimited {@code FROM} keyword. */
    private static final Pattern FROM = Pattern.compile("\\sFROM\\s", Pattern.CASE_INSENSITIVE);

    /**
     * @param idfac factory used to create the attribute IDs returned by {@link #getAttributes(String)}
     */
    public ApproximateSelectQueryAttributeExtractor(QuotedIDFactory idfac) {
        this.idfac = idfac;
    }

    /**
     * Crudely extracts the attribute names from the projection of a SELECT query.
     *
     * <p>The projection is taken to be the text between the leading
     * {@code SELECT [DISTINCT]} and the first whitespace-delimited {@code FROM}.
     * All parenthesised groups are removed from it, the remainder is split on
     * commas, and for every item matched by {@link #AS} the alias (if present)
     * or otherwise the column name is converted into an attribute ID.
     * Items in which the pattern finds no match are skipped.
     *
     * @param sql the SQL query text
     * @return the attribute IDs, in the order the items appear in the projection
     * @throws InvalidQueryException if no SELECT or no FROM clause can be located
     */
    public ImmutableList<QuotedID> getAttributes(String sql) throws InvalidQueryException {
        Matcher startMatcher = SELECT.matcher(sql);
        if (!startMatcher.find()) {
            throw new InvalidQueryException("Error parsing SQL query: Couldn't find SELECT clause", sql);
        }
        int start = startMatcher.end();

        Matcher endMatcher = FROM.matcher(sql);
        if (!endMatcher.find()) {
            throw new InvalidQueryException("Error parsing SQL query: Couldn't find FROM clause", sql);
        }
        int end = endMatcher.start();

        String projection = sql.substring(start, end);

        // remove all brackets: each pass strips the innermost groups, so the loop
        // repeats until no parenthesised group is left (this handles nesting)
        for (Matcher matcher = BRACKETS.matcher(projection); matcher.find(); matcher = BRACKETS.matcher(projection)) {
            projection = matcher.replaceAll("");
        }

        final ImmutableList.Builder<QuotedID> attributes = ImmutableList.builder();
        for (String column : COL_SEP.split(projection)) {
            Matcher columnMatcher = AS.matcher(column);
            if (columnMatcher.find()) {
                String columnString = columnMatcher.group("column");
                String aliasString = columnMatcher.group("alias");
                // an explicit alias takes precedence over the column name
                QuotedID attribute = idfac.createAttributeID(aliasString == null ? columnString : aliasString);
                attributes.add(attribute);
            }
        }
        return attributes.build();
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy