// org.aksw.sparqlify.update.IncrementalQueryUpdateManager Maven / Gradle / Ivy
package org.aksw.sparqlify.update;
import java.sql.SQLException;
import java.util.ArrayList;
import java.util.Collection;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Set;
import org.aksw.commons.collections.diff.HashSetDiff;
import org.aksw.jena_sparql_api.utils.DnfUtils;
import org.aksw.jena_sparql_api.utils.FilterUtils;
import org.aksw.jena_sparql_api.utils.QuadUtils;
import org.aksw.jena_sparql_api.views.PatternUtils;
import org.apache.jena.graph.Node;
import org.apache.jena.query.Query;
import org.apache.jena.query.QueryFactory;
import org.apache.jena.query.ResultSet;
import org.apache.jena.sparql.algebra.Algebra;
import org.apache.jena.sparql.algebra.Op;
import org.apache.jena.sparql.core.Quad;
import org.apache.jena.sparql.engine.binding.Binding;
import org.apache.jena.sparql.expr.Expr;
import org.apache.jena.sparql.expr.ExprList;
import org.apache.jena.sparql.resultset.ResultSetMem;
import com.google.common.base.Joiner;
/**
* Keeps track of changes to a sparql query result
* in the course of updates.
*
*
* @author Claus Stadler
*
*/
public class IncrementalQueryUpdateManager
implements GraphListener
{
//private Map> sigToGraphs = new HashMap>();
/** One filter per quad pattern of the tracked query; filled by the constructor. */
Set<QuadFilter> quadFilters = new HashSet<QuadFilter>();
/** Endpoint against which the tracked query and existence checks are executed. */
private ModelSparqlEndpoint sparqlEndpoint;
/** Parsed form of the query whose result is being tracked. */
private Query query;
//private Set dirtyQuads = new HashSet();
/** Relevant quads recorded via add/remove and not yet processed. */
HashSetDiff<Quad> diff = new HashSetDiff<Quad>();
/** Result bindings gained/lost since the accumulator was last cleared by getChanges(). */
HashSetDiff<Binding> aggregatedChanges = new HashSetDiff<Binding>();
/**
 * Tells whether at least one of this view's quad filters accepts the given quad.
 *
 * @param quad the quad to test
 * @return {@code true} as soon as one filter accepts the quad, {@code false} if none does
 */
public boolean isRelevant(Quad quad) {
    boolean accepted = false;
    for (QuadFilter candidate : quadFilters) {
        if (candidate.doesAccept(quad)) {
            accepted = true;
            break;
        }
    }
    return accepted;
}
/**
 * Asks the SPARQL endpoint whether the given quad is present in the store.
 * FIXME Implement for batched checking
 *
 * @param quad the quad to look up
 * @return the outcome of executing the ASK request built by
 *         {@code FilterCompiler.askForQuad(quad)}
 */
public boolean doesExist(Quad quad) {
    return sparqlEndpoint
            .createQueryExecution(FilterCompiler.askForQuad(quad))
            .execAsk();
}
/**
 * Re-evaluates the tracked query, restricted to solutions that can involve the given quads.
 *
 * <p>For every quad and every quad filter accepting it, the variables of the filter's
 * pattern are mapped to the quad's nodes and compiled into a conjunction of filter
 * expressions. All conjunctions are OR-ed into a single filter, which is spliced into the
 * query text right before its last closing brace.
 *
 * @param quads the quads to evaluate the query against
 * @return the result set of the restricted query, or an empty in-memory result set when
 *         no quad is accepted by any quad filter
 */
public ResultSet processQuads(Iterable<Quad> quads) {
    List<String> orFilters = new ArrayList<String>();

    for (Quad quad : quads) {
        for (QuadFilter graph : quadFilters) {
            if (!graph.doesAccept(quad)) {
                continue;
            }

            // Take the original query, and evaluate it against the new triple.
            // TODO Currently we create a single huge filter statement.
            // A different strategy would be to create unions.
            // Might be worth evaluating what the performance difference is.
            // NOTE(review): key/value types assumed to be Node — confirm against QuadUtils.
            Map<Node, Node> varMap = QuadUtils.getVarMapping(graph.getPattern(), quad);

            List<String> andFilters = new ArrayList<String>();
            for (Map.Entry<Node, Node> entry : varMap.entrySet()) {
                andFilters.add(
                        FilterCompiler.compileFilter(entry.getValue(), "?" + entry.getKey().getName()));
            }

            // An empty mapping imposes no constraint. Emitting "true" instead of an
            // empty string avoids producing the invalid disjunct "()".
            orFilters.add(andFilters.isEmpty() ? "true" : Joiner.on(" && ").join(andFilters));
        }
    }

    if (orFilters.isEmpty()) {
        return new ResultSetMem();
    }

    String filter = FilterCompiler.wrapFilter("(" + Joiner.on(") || (").join(orFilters) + ")");

    // TODO This is a string hack to append our filter to the original query.
    // Maybe there is a clean, structured jena way to do that?
    String qs = query.toString();
    int hackPos = qs.lastIndexOf("}");
    qs = qs.substring(0, hackPos) + filter + "}";

    return sparqlEndpoint.createQueryExecution(qs).execSelect();
}
/**
 * Hook for quads that were actually removed from the underlying store; calling it for
 * other quads would let the view go out of sync.
 *
 * <p>The current body only performs the relevance check and takes no further action.
 *
 * @param quad the quad that was removed from the store
 */
public void removeSeen(Quad quad) {
    if (isRelevant(quad)) {
        // NOTE(review): nothing is done for relevant quads yet — confirm whether
        // an implementation is still pending here.
    }
}
/**
 * Records a quad as added, provided it is relevant to this view.
 *
 * <p>Must only be called for triples that were actually added to the underlying store;
 * otherwise the view will go out of sync.
 *
 * @param quad the quad that was added to the store
 */
public void add(Quad quad) {
    if (isRelevant(quad)) {
        diff.add(quad);
    }
}
/**
 * Drains a result set into a set of its bindings.
 *
 * @param rs the result set to consume; it is iterated until {@code hasNext()} is false
 * @return a new set containing every binding obtained from {@code rs.nextBinding()}
 */
public static Set<Binding> resultSetToBindings(ResultSet rs) {
    Set<Binding> result = new HashSet<Binding>();
    while (rs.hasNext()) {
        result.add(rs.nextBinding());
    }
    return result;
}
/**
 * Returns the binding changes accumulated so far and resets the accumulator.
 *
 * @return a new diff holding copies of the accumulated added and removed bindings;
 *         the internal accumulator is cleared before returning
 */
public HashSetDiff<Binding> getChanges() {
    HashSetDiff<Binding> result = new HashSetDiff<Binding>();
    result.getAdded().addAll(aggregatedChanges.getAdded());
    result.getRemoved().addAll(aggregatedChanges.getRemoved());

    // Hand out a snapshot so that clearing the accumulator does not affect the caller.
    aggregatedChanges.clear();
    return result;
}
/**
 * Evaluates the tracked query for all pending added quads and records the resulting
 * bindings as additions in the aggregated changes. The pending added quads are cleared.
 */
public void computeInserts() {
    System.out.println("#dirty quads: " + diff.getAdded().size());

    Set<Binding> added = resultSetToBindings(processQuads(diff.getAdded()));
    diff.getAdded().clear();

    for (Binding item : added) {
        aggregatedChanges.add(item);
    }
}
/**
 * Evaluates the tracked query for all pending removed quads and records the resulting
 * bindings as removals in the aggregated changes. The pending removed quads are cleared.
 */
public void computeDeletions() {
    System.out.println("#deletion dirty quads: " + diff.getRemoved().size());

    Set<Binding> removed = resultSetToBindings(processQuads(diff.getRemoved()));
    diff.getRemoved().clear();

    for (Binding item : removed) {
        aggregatedChanges.remove(item);
    }
}
/**
 * Records a quad as removed, provided it is relevant to this view.
 *
 * @param quad the quad being removed
 */
public void remove(Quad quad) {
    if (isRelevant(quad)) {
        diff.remove(quad);
    }
}
/**
 * Creates a manager that tracks the result of the given query on the given endpoint.
 *
 * <p>The query is compiled to quad-form algebra. Its filter expressions are collected and
 * converted into clauses (printed as "DNF"). For each quad pattern of the query, the part
 * of that filter applying to the quad is determined and stored as a {@code QuadFilter}.
 *
 * @param queryString the SPARQL query whose result is tracked
 * @param sparqlEndpoint the endpoint the query is evaluated against later on
 * @throws SQLException declared for callers; no statement visible in this constructor throws it
 * @throws RuntimeException if the view definition is detected to be unsatisfiable
 */
public IncrementalQueryUpdateManager(String queryString, ModelSparqlEndpoint sparqlEndpoint)
        throws SQLException {
    this.sparqlEndpoint = sparqlEndpoint;
    this.query = QueryFactory.create(queryString);

    Op op = Algebra.compile(query);
    op = Algebra.toQuadForm(op);
    System.out.println(op);

    // TODO Hack! Does not work with unions (because they scope filters)
    ExprList exprs = FilterUtils.collectExprs(op, new ExprList());
    Collection<Quad> quads = PatternUtils.collectQuads(op, new ArrayList<Quad>());

    // NOTE(review): element types below were reconstructed from usage and the file's
    // imports (Expr, ExprList) — confirm against DnfUtils/FilterUtils signatures.
    List<ExprList> clauses = DnfUtils.toClauses(exprs);
    System.out.println("DNF = " + clauses);
    Set<Set<Expr>> dnf = FilterUtils.toSets(clauses);

    // A null DNF is treated as satisfiable; only a non-null DNF is actually checked.
    boolean isSatisfiable = dnf == null || DnfUtils.isSatisfiable(dnf);
    if (!isSatisfiable) {
        throw new RuntimeException("The view definition was detected to not be satisfiable");
    }

    for (Quad quad : quads) {
        Set<Set<Expr>> filter = FilterUtils.determineFilterDnf(quad, dnf);
        System.out.println("For quad " + quad + " got expr " + filter);
        quadFilters.add(new QuadFilter(quad, filter));
    }
}
// TODO The incremental update manager is separate from the view
/**
 * Runs a SELECT query on the endpoint and inserts every resulting binding into the view table.
 *
 * @param sparqlEndpoint the endpoint to query
 * @param queryString the query to execute
 * @param viewTable the table receiving one insert per binding
 * @throws SQLException declared by this method; presumably raised by the view table — confirm
 */
public static void sparqlIntoView(ModelSparqlEndpoint sparqlEndpoint, String queryString, ViewTable viewTable)
        throws SQLException {
    ResultSet rows = sparqlEndpoint.createQueryExecution(queryString).execSelect();
    for (; rows.hasNext(); ) {
        Binding row = rows.nextBinding();
        viewTable.insert(row);
    }
}
/** Listener callback; this implementation takes no action. */
@Override
public void onPreBatchStart() {
// Intentionally empty (auto-generated stub, nothing to do here so far).
}
/**
 * Listener callback: forwards the quad to {@link #add(Quad)}.
 *
 * @param quad the quad reported by the listener source
 */
@Override
public void onPreInsert(Quad quad) {
    add(quad);
}
/**
 * Listener callback: forwards the quad to {@link #remove(Quad)}.
 *
 * @param quad the quad reported by the listener source
 */
@Override
public void onPreDelete(Quad quad) {
    remove(quad);
}
/**
 * Listener callback: processes the pending removed quads via {@link #computeDeletions()}.
 * NOTE(review): presumably run in the pre-phase so the quads are still in the store
 * when the query is evaluated — confirm.
 */
@Override
public void onPreBatchEnd() {
    this.computeDeletions();
}
/** Listener callback; this implementation takes no action. */
@Override
public void onPostBatchStart() {
// Intentionally empty (auto-generated stub, nothing to do here so far).
}
/** Listener callback; the quad is ignored here (inserts are recorded in onPreInsert). */
@Override
public void onPostInsert(Quad quad) {
// Intentionally empty (auto-generated stub, nothing to do here so far).
}
/** Listener callback; the quad is ignored here (deletes are recorded in onPreDelete). */
@Override
public void onPostDelete(Quad quad) {
// Intentionally empty (auto-generated stub, nothing to do here so far).
}
/**
 * Listener callback: processes the pending added quads via {@link #computeInserts()}.
 * NOTE(review): presumably run in the post-phase so the quads are already in the store
 * when the query is evaluated — confirm.
 */
@Override
public void onPostBatchEnd() {
    this.computeInserts();
}
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy