com.bigdata.rdf.sparql.ast.TestStaticAnalysis_CanJoinUsingConstraints Maven / Gradle / Ivy
Show all versions of bigdata-rdf-test Show documentation
/**
Copyright (C) SYSTAP, LLC DBA Blazegraph 2006-2016. All rights reserved.
Contact:
SYSTAP, LLC DBA Blazegraph
2501 Calvert ST NW #106
Washington, DC 20008
[email protected]
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*/
/*
* Created on Oct 20, 2011
*/
package com.bigdata.rdf.sparql.ast;
import java.util.Arrays;
import java.util.LinkedHashSet;
import java.util.Random;
import java.util.Set;
import org.apache.log4j.Logger;
import com.bigdata.bop.Constant;
import com.bigdata.rdf.internal.IV;
import com.bigdata.rdf.internal.VTE;
import com.bigdata.rdf.internal.impl.TermId;
/**
* This test suite is built around around BSBM Q5. Each test has an existing
* join path and a new vertex to be added to the join path. The question is
* whether or not the vertex can join with the join path using one or
* more shared variable(s). This tests a method used to incrementally grow a
* join path when it is dynamically decided that an {@link IJoinNode} may be
* added to the join path based on shared variables. Static analysis easily
* reports those joins which are allowed based on the variables directly given
* with two {@link IJoinNode}s. The purpose of this test suite is to explore
* when joins (based on shared variables) become permissible through
* {@link FilterNode}s as the variable(s) used within those constraints become
* bound.
*
* This set of unit tests explores various join paths and verifies that the
* canJoin() and canJoinUsingConstraints() methods correctly recognize edges by
* which a join path can be extended corresponding to both static and dynamic
* analysis of the query.
*
* @see StaticAnalysis#canJoin(IJoinNode, IJoinNode)
* @see {@link StaticAnalysis#canJoinUsingConstraints(IJoinNode[], IJoinNode, FilterNode[])}
*
* @author Bryan Thompson
* @version $Id: TestBOpUtility_canJoinUsingConstraints.java 4211 2011-02-20
* 21:20:44Z thompsonbry $
*
* @todo These are the full plans generated by the runtime and static
* optimizers. One way to test canJoinXXX() is to run out these join plans
* and verify that they report "true" in each case. However, the critical
* bit to test are join plans where the predicates w/o the shared
* variables can be run earlier due to the FILTERs.
*
*
* test_bsbm_q5 : static [0] : : ids=[1, 2, 4, 6, 0, 3, 5]
* test_bsbm_q5 : runtime[0] : : ids=[1, 2, 0, 4, 6, 3, 5]
*
*/
//@SuppressWarnings("unchecked")
public class TestStaticAnalysis_CanJoinUsingConstraints extends
AbstractASTEvaluationTestCase {
private static final Logger log = Logger
.getLogger(TestStaticAnalysis_CanJoinUsingConstraints.class);
/**
*
*/
public TestStaticAnalysis_CanJoinUsingConstraints() {
}
/**
* @param name
*/
public TestStaticAnalysis_CanJoinUsingConstraints(final String name) {
super(name);
}
/**
* Return a (Mock) IV.
*/
@SuppressWarnings("rawtypes")
private IV mockIV() {
return TermId.mockIV(VTE.URI);
}
/**
* Unit tests to verify that arguments are validated.
*
* @see StaticAnalysis#canJoinUsingConstraints(IJoinNode[], IJoinNode, FilterNode[])
*/
public void test_canJoinUsingConstraints_illegalArgument() {
@SuppressWarnings("rawtypes")
final ConstantNode p = new ConstantNode(new Constant(mockIV()));
@SuppressWarnings("rawtypes")
final ConstantNode q = new ConstantNode(new Constant(mockIV()));
@SuppressWarnings("rawtypes")
final ConstantNode r = new ConstantNode(new Constant(mockIV()));
final VarNode x = new VarNode("x");
final VarNode y = new VarNode("y");
// Note: no shared variables.
final StatementPatternNode p1 = new StatementPatternNode(x, q, r);
final StatementPatternNode p2 = new StatementPatternNode(y, p, q);
final StaticAnalysis sa = new StaticAnalysis(new QueryRoot(QueryType.SELECT));
// path must not be null.
try {
sa.canJoinUsingConstraints(//
null, // path
p1,// vertex
new FilterNode[0]// constraints
);
fail("Expecting: " + IllegalArgumentException.class);
} catch (IllegalArgumentException ex) {
if (log.isInfoEnabled())
log.info("Expecting: " + IllegalArgumentException.class);
}
// vertex must not be null.
try {
sa.canJoinUsingConstraints(//
new IJoinNode[]{p1}, // path
null,// vertex
new FilterNode[0]// constraints
);
fail("Expecting: " + IllegalArgumentException.class);
} catch (IllegalArgumentException ex) {
if (log.isInfoEnabled())
log.info("Expecting: " + IllegalArgumentException.class);
}
// path may not be empty.
try {
sa.canJoinUsingConstraints(//
new IJoinNode[] {}, // path
p1,// vertex
new FilterNode[0]// constraints
);
fail("Expecting: " + IllegalArgumentException.class);
} catch (IllegalArgumentException ex) {
if (log.isInfoEnabled())
log.info("Expecting: " + IllegalArgumentException.class);
}
// path elements may not be null.
try {
sa.canJoinUsingConstraints(//
new IJoinNode[] { p2, null }, // path
p1,// vertex
new FilterNode[0]// constraints
);
fail("Expecting: " + IllegalArgumentException.class);
} catch (IllegalArgumentException ex) {
if (log.isInfoEnabled())
log.info("Expecting: " + IllegalArgumentException.class);
}
// vertex must not appear in the path.
try {
sa.canJoinUsingConstraints(//
new IJoinNode[] { p2, p1 }, // path
p1,// vertex
new FilterNode[0]// constraints
);
fail("Expecting: " + IllegalArgumentException.class);
} catch (IllegalArgumentException ex) {
if (log.isInfoEnabled())
log.info("Expecting: " + IllegalArgumentException.class);
}
// constraint array may not contain null elements.
try {
sa.canJoinUsingConstraints(//
new IJoinNode[] { p2 }, // path
p1,// vertex
new FilterNode[] { //
new FilterNode(new VarNode("x")),
null //
}// constraints
);
fail("Expecting: " + IllegalArgumentException.class);
} catch (IllegalArgumentException ex) {
if (log.isInfoEnabled())
log.info("Expecting: " + IllegalArgumentException.class);
}
}
/**
* Unit test for one-step joins based on the {@link #product} variable.
*/
public void test_canJoinUsingConstraints_1step_productVar() {
final BSBMQ5Setup s = new BSBMQ5Setup(store);
final StaticAnalysis sa = new StaticAnalysis(s.queryRoot);
// share ?product
final IJoinNode[] a = new IJoinNode[] { s.p0, s.p2, s.p4, s.p6 };
for (int i = 0; i < a.length; i++) {
for (int j = i; j < a.length; j++) {
final IJoinNode t0 = a[i];
final IJoinNode t1 = a[j];
assertTrue(sa.canJoin(t0, t1));
assertTrue(sa.canJoin(t1, t0));
if (t0 != t1) {
/*
* Test join path extension, but not when the vertex used to
* extend the path is already present in the join path.
*/
assertTrue(sa.canJoinUsingConstraints(//
new IJoinNode[] { t0 }, // path
t1,// vertex
new FilterNode[0]// constraints
));
assertTrue(sa.canJoinUsingConstraints(//
new IJoinNode[] { t1 }, // path
t0,// vertex
new FilterNode[0]// constraints
));
}
}
}
}
/**
* Unit test for multi-step join paths based on the {@link #product}
* variable.
*/
public void test_canJoinUsingConstraints_multiStep_productVar() {
final BSBMQ5Setup s = new BSBMQ5Setup(store);
final StaticAnalysis sa = new StaticAnalysis(s.queryRoot);
final Random r = new Random();
// share ?product
final IJoinNode[] a = new IJoinNode[] { s.p0, s.p2, s.p4, s.p6 };
// existing path length [1:3].
final int existingPathLength = r.nextInt(3) + 1;
// generated pre-existing path.
final IJoinNode[] path = new IJoinNode[existingPathLength];
// vertex which will extend that path
final IJoinNode vertex;
{
// collection of predicates used so far by the path.
final Set used = new LinkedHashSet();
for (int i = 0; i < path.length; i++) {
// Locate an unused predicate.
int index;
while (true) {
index = r.nextInt(a.length);
if (!used.contains(index)) {
used.add(index);
break;
}
}
// add to the path.
path[i] = a[index];
}
// Locate an unused predicate to serve as the extension vertex.
{
// Locate an unused predicate.
int index;
while (true) {
index = r.nextInt(a.length);
if (!used.contains(index)) {
used.add(index);
break;
}
}
vertex = a[index];
}
}
// Verify all joins in the path are legal.
for (int i = 0; i < path.length - 1; i++) {
assertTrue(sa.canJoin(path[i], path[i + 1]));
}
// Verify the extension of the path is legal.
assertTrue(sa.canJoinUsingConstraints(//
path,//
vertex,//
new FilterNode[0]// constraints
));
}
/**
* Unit test examines the predicates without shared variables and verifies
* (a) that joins are not permitted when the constraints are not considered;
* and (b) that joins are permitted when the constraints are considered.
*
* This test is identical to {@link #test_canJoinUsingConstraints_p5_p6()()}
* except that it considers the ({@link #p3} x {@link #p4}) join via the
* {@link #c1} constraint instead.
*/
public void test_canJoinUsingConstraints_p3_p4() {
final BSBMQ5Setup s = new BSBMQ5Setup(store);
final StaticAnalysis sa = new StaticAnalysis(s.queryRoot);
/*
* Verify (p3,p4) join is not permitted when we do not consider the
* constraints (i.e., the join would be an unconstrained cross product
* if it were executed).
*/
assertFalse(sa.canJoin(s.p3, s.p4));
assertFalse(sa.canJoin(s.p4, s.p3));
assertFalse(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p3 }, // path
s.p4,// vertex
new FilterNode[0]// constraints
));
assertFalse(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p4 }, // path
s.p3,// vertex
new FilterNode[0]// constraints
));
/*
* Verify (p3,p4) join is not permitted if we do not consider the
* constraint which provides the shared variables.
*/
assertFalse(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p3 }, // path
s.p4,// vertex
new FilterNode[] { s.c2 }// constraints
));
assertFalse(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p4 }, // path
s.p3,// vertex
new FilterNode[] { s.c2 }// constraints
));
/*
* Verify (p3,p4) join is permitted if we consider the constraint which
* provides the shared variables.
*/
assertTrue(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p3 }, // path
s.p4,// vertex
new FilterNode[] { s.c1 }// constraints
));
assertTrue(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p4 }, // path
s.p3,// vertex
new FilterNode[] { s.c1 }// constraints
));
}
/**
* Unit test examines the predicates without shared variables and verifies
* (a) that joins are not permitted when the constraints are not considered;
* and (b) that joins are permitted when the constraints are considered.
*
* This test is identical to {@link #test_canJoinUsingConstraints_p3_p4()}
* except that it considers the ({@link #p5} x {@link #p6}) join via the
* {@link #c2} constraint instead.
*/
public void test_canJoinUsingConstraints_p5_p6() {
final BSBMQ5Setup s = new BSBMQ5Setup(store);
final StaticAnalysis sa = new StaticAnalysis(s.queryRoot);
/*
* Verify (p5,p6) join is not permitted when we do not consider the
* constraints (i.e., the join would be an unconstrained cross product
* if it were executed).
*/
assertFalse(sa.canJoin(s.p5, s.p6));
assertFalse(sa.canJoin(s.p6, s.p5));
assertFalse(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p5 }, // path
s.p6,// vertex
new FilterNode[0]// constraints
));
assertFalse(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p6 }, // path
s.p5,// vertex
new FilterNode[0]// constraints
));
/*
* Verify (p5,p6) join is not permitted if we do not consider the
* constraint which provides the shared variables.
*/
assertFalse(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p5 }, // path
s.p6,// vertex
new FilterNode[] { s.c1 }// constraints
));
assertFalse(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p6 }, // path
s.p5,// vertex
new FilterNode[] { s.c1 }// constraints
));
/*
* Verify (p5,p6) join is permitted if we consider the constraint which
* provides the shared variables.
*/
assertTrue(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p5 }, // path
s.p6,// vertex
new FilterNode[] { s.c2 }// constraints
));
assertTrue(sa.canJoinUsingConstraints(//
new IJoinNode[] { s.p6 }, // path
s.p5,// vertex
new FilterNode[] { s.c2 }// constraints
));
}
/*
* Unit tests for attaching constraints using a specific join path.
*/
/** path = [1, 2, 4, 6, 0, 3, 5]
*/
public void test_attachConstraints_BSBM_Q5_path01() {
final BSBMQ5Setup s = new BSBMQ5Setup(store);
final StaticAnalysis sa = new StaticAnalysis(s.queryRoot);
final IJoinNode[] path = { s.p1, s.p2, s.p4, s.p6, s.p0, s.p3, s.p5 };
final FilterNode[][] actual = sa
.getJoinGraphConstraints(path, s.constraints,
null/* knownBoundVars */, true/* pathIsComplete */);
@SuppressWarnings("unchecked")
final Set[] expected = new Set[] { //
s.NA, // p1
s.C0, // p2
s.NA, // p4
s.NA, // p6
s.NA, // p0
s.C1, // p3
s.C2, // p5
};
assertSameConstraints(expected, actual);
}
/** [5, 3, 1, 0, 2, 4, 6]
. */
public void test_attachConstraints_BSBM_Q5_path02() {
final BSBMQ5Setup s = new BSBMQ5Setup(store);
final StaticAnalysis sa = new StaticAnalysis(s.queryRoot);
final IJoinNode[] path = { s.p5, s.p3, s.p1, s.p0, s.p2, s.p4, s.p6 };
final FilterNode[][] actual = sa
.getJoinGraphConstraints(path, s.constraints,
null/* knownBoundVars */, true/* pathIsComplete */);
@SuppressWarnings("unchecked")
final Set[] expected = new Set[] { //
s.NA, // p5
s.NA, // p3
s.NA, // p1
s.C0, // p0
s.NA, // p2
s.C1, // p4
s.C2, // p6
};
assertSameConstraints(expected, actual);
}
/** [3, 4, 5, 6, 1, 2, 0]
(key-range constraint variant). */
public void test_attachConstraints_BSBM_Q5_path03() {
final BSBMQ5Setup s = new BSBMQ5Setup(store);
final StaticAnalysis sa = new StaticAnalysis(s.queryRoot);
final IJoinNode[] path = { s.p3, s.p4, s.p5, s.p6, s.p1, s.p2, s.p0 };
final FilterNode[][] actual = sa
.getJoinGraphConstraints(path, s.constraints,
null/* knownBoundVars */, true/* pathIsComplete */);
@SuppressWarnings("unchecked")
final Set[] expected = new Set[] { //
s.NA, // p3
asSet(new FilterNode[]{s.c0,s.c1}), // p4
s.NA, // p5
s.C2, // p6
s.NA, // p1
s.NA, // p2
s.NA, // p0
};
assertSameConstraints(expected, actual);
}
/**
* [5 6 0 2 1 4 3]
.
*
* FIXME The above join path produces a false ZERO result for the query and
* all of the join path segments below produce a false exact ZERO (0E)
* cardinality estimate. Figure out why. The final path chosen could have
* been any of the one step extensions of a path with a false 0E cardinality
* estimate.
*
*
* INFO : 3529 main com.bigdata.bop.joinGraph.rto.JGraph.expand(JGraph.java:1116):
* ** round=4: paths{in=14,considered=26,out=6}
* path srcCard * f ( in sumRgCt tplsRead out limit adjCard) = estRead estCard : sumEstRead sumEstCard sumEstCost joinPath
* 0 0E * 0.00 ( 0 0 0 0 200 0) = 0 0E : 1 0 0 [ 5 6 0 2 1 4 ]
* 1 0E * 0.00 ( 0 0 0 0 200 0) = 0 0E : 1 0 0 [ 5 6 0 2 4 3 ]
* 2 0E * 0.00 ( 0 0 0 0 200 0) = 0 0E : 1 0 0 [ 5 6 0 4 1 3 ]
* 3 0E * 0.00 ( 0 0 0 0 200 0) = 0 0E : 1 0 0 [ 5 6 2 1 4 3 ]
* 4 208 * 1.00 ( 26 26 26 26 400 26) = 26 208 : 16576 1447 1447 [ 5 3 1 2 4 0 ]
* 5 0E * 0.00 ( 0 0 0 0 200 0) = 0 0E : 2 1 1 [ 5 3 6 0 1 2 ]
*
*/
public void test_attachConstraints_BSBM_Q5_path04() {
final BSBMQ5Setup s = new BSBMQ5Setup(store);
final StaticAnalysis sa = new StaticAnalysis(s.queryRoot);
final IJoinNode[] path = { s.p5, s.p6, s.p0, s.p2, s.p1, s.p4, s.p3 };
final FilterNode[][] actual = sa
.getJoinGraphConstraints(path, s.constraints,
null/* knownBoundVars */, true/* pathIsComplete */);
@SuppressWarnings("unchecked")
final Set[] expected = new Set[] { //
s.NA, // p5
asSet(new FilterNode[] { s.c0, s.c2 }), // p6
s.NA, // p0
s.NA, // p2
s.NA, // p1
s.NA, // p4
s.C1, // p3
};
assertSameConstraints(expected, actual);
}
/**
* Verifies that the right set of constraints is attached at each of the
* vertices of a join path. Comparison of {@link FilterNode} instances is by
* reference.
*
* @param expected
* @param actual
*/
static void assertSameConstraints(final Set[] expected,
final FilterNode[][] actual) {
assertEquals("length", expected.length, actual.length);
for (int i = 0; i < expected.length; i++) {
final Set e = expected[i];
final FilterNode[] a = actual[i];
if (e.size() != a.length) {
fail("Differs at expected[" + i + "] : expecting " + e.size()
+ ", not " + a.length + " elements: "
+ Arrays.toString(a));
}
for (int j = 0; j < a.length; j++) {
boolean foundRef = false;
for (FilterNode t : e) {
if (t == a[j]) {
foundRef = true;
break;
}
}
if (!foundRef) {
fail("Differs at expected[" + i + "][" + j + "] : actual="
+ a[j]);
}
}
}
}
}