
com.xmlcalabash.extensions.Sparql Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of xmlcalabash1-rdf Show documentation
Show all versions of xmlcalabash1-rdf Show documentation
XML Calabash extension steps to load/query RDF
The newest version!
package com.xmlcalabash.extensions;
import com.hp.hpl.jena.query.Query;
import com.hp.hpl.jena.query.QueryExecution;
import com.hp.hpl.jena.query.QueryExecutionFactory;
import com.hp.hpl.jena.query.QueryFactory;
import com.hp.hpl.jena.query.QuerySolution;
import com.hp.hpl.jena.query.ResultSet;
import com.hp.hpl.jena.query.ResultSetFormatter;
import com.hp.hpl.jena.rdf.model.Literal;
import com.hp.hpl.jena.rdf.model.RDFNode;
import com.hp.hpl.jena.rdf.model.Resource;
import com.hp.hpl.jena.rdf.model.StmtIterator;
import com.xmlcalabash.core.XMLCalabash;
import com.xmlcalabash.core.XProcConstants;
import com.xmlcalabash.core.XProcException;
import com.xmlcalabash.core.XProcRuntime;
import com.xmlcalabash.io.ReadablePipe;
import com.xmlcalabash.runtime.XAtomicStep;
import com.xmlcalabash.util.Base64;
import com.xmlcalabash.util.S9apiUtils;
import com.xmlcalabash.util.TreeWriter;
import com.xmlcalabash.util.XProcURIResolver;
import net.sf.saxon.s9api.QName;
import net.sf.saxon.s9api.SaxonApiException;
import net.sf.saxon.s9api.XdmNode;
import org.apache.jena.riot.Lang;
import org.apache.jena.riot.RiotReader;
import org.apache.jena.riot.lang.LangRIOT;
import org.apache.jena.riot.system.ErrorHandler;
import org.apache.jena.riot.system.ParserProfile;
import org.apache.jena.riot.system.RiotLib;
import org.apache.jena.riot.system.StreamRDF;
import org.apache.jena.riot.system.StreamRDFLib;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.xml.sax.InputSource;
import javax.xml.transform.Source;
import javax.xml.transform.TransformerException;
import javax.xml.transform.URIResolver;
import javax.xml.transform.sax.SAXSource;
import java.io.IOException;
import java.io.InputStream;
import java.net.MalformedURLException;
import java.net.URI;
import java.net.URISyntaxException;
import java.net.URL;
import java.net.URLConnection;
import java.util.Iterator;
/**
 * XML Calabash extension step {@code cx:sparql}.
 *
 * <p>Every document read from the {@code source} port is loaded into the dataset with
 * {@code loadRdf}; the query read from the {@code query} port is then executed as a SPARQL
 * SELECT against that dataset and the solutions are written to the result pipe as a single
 * document in the {@code http://www.w3.org/2005/sparql-results#} vocabulary.
 *
 * <p>NOTE(review): {@code source}, {@code result}, {@code dataset}, {@code runtime},
 * {@code step}, {@code loadRdf}, {@code _encoding}, {@code _datatype}, {@code library_xpl}
 * and {@code library_url} are not declared in this class; they are presumably inherited from
 * {@link RDFStep} or its ancestors.
 */
@XMLCalabash(
        name = "cx:sparql",
        type = "{http://xmlcalabash.com/ns/extensions}sparql")
public class Sparql extends RDFStep {
    /** Namespace of the SPARQL query results XML vocabulary. */
    private static final String NS_SPARQL_RESULTS = "http://www.w3.org/2005/sparql-results#";

    /** Charset used to turn a base64-decoded query back into text. */
    private static final java.nio.charset.Charset UTF_8 =
            java.nio.charset.Charset.forName("UTF-8");

    private static final QName _content_type = new QName("content-type");
    private static final QName s_sparql = new QName(NS_SPARQL_RESULTS, "sparql");
    private static final QName s_head = new QName(NS_SPARQL_RESULTS, "head");
    private static final QName s_variable = new QName(NS_SPARQL_RESULTS, "variable");
    private static final QName s_results = new QName(NS_SPARQL_RESULTS, "results");
    private static final QName s_result = new QName(NS_SPARQL_RESULTS, "result");
    private static final QName s_binding = new QName(NS_SPARQL_RESULTS, "binding");
    private static final QName s_literal = new QName(NS_SPARQL_RESULTS, "literal");
    private static final QName s_uri = new QName(NS_SPARQL_RESULTS, "uri");
    private static final QName s_bnode = new QName(NS_SPARQL_RESULTS, "bnode");
    private static final QName _name = new QName("", "name");

    /** Pipe bound to the {@code query} input port; supplies the SPARQL query document. */
    private ReadablePipe query = null;

    /**
     * Creates the step.
     *
     * @param runtime the runtime passed through to the superclass
     * @param step the atomic step passed through to the superclass
     */
    public Sparql(XProcRuntime runtime, XAtomicStep step) {
        super(runtime, step);
    }

    /**
     * Binds an input pipe to one of the two ports this step knows about.
     * Any other port name is silently ignored.
     *
     * @param port the port name, {@code "source"} or {@code "query"}
     * @param pipe the pipe to read that port's documents from
     */
    @Override
    public void setInput(String port, ReadablePipe pipe) {
        if ("source".equals(port)) {
            source = pipe;
        } else if ("query".equals(port)) {
            query = pipe;
        }
    }

    /**
     * Loads all source documents, executes the query and writes the results document.
     *
     * @throws SaxonApiException if reading an input document fails
     * @throws XProcException if a solution binds a value that is neither a literal nor a resource
     */
    @Override
    public void run() throws SaxonApiException {
        super.run();

        while (source.moreDocuments()) {
            XdmNode doc = source.read();
            loadRdf(dataset, doc);
        }

        Query sparqlQuery = QueryFactory.create(readSparqlQueryText());
        QueryExecution qe = QueryExecutionFactory.create(sparqlQuery, dataset);
        XdmNode resultDoc;
        try {
            resultDoc = buildSparqlResults(qe.execSelect());
        } finally {
            // Release the execution even when building the result document fails.
            qe.close();
        }
        result.write(resultDoc);
    }

    /**
     * Reads the query document and returns the query text. The text is base64-decoded when
     * the root is a {@code c:data} element with content type {@code application/octet-stream}
     * or when its encoding attribute is {@code base64}; otherwise the string value is used
     * as is.
     */
    private String readSparqlQueryText() throws SaxonApiException {
        XdmNode root = S9apiUtils.getDocumentElement(query.read());

        boolean binaryData = XProcConstants.c_data.equals(root.getNodeName())
                && "application/octet-stream".equals(root.getAttributeValue(_content_type));

        if (binaryData || "base64".equals(root.getAttributeValue(_encoding))) {
            byte[] decoded = Base64.decode(root.getStringValue());
            // Decode explicitly as UTF-8 so the query text does not depend on the
            // platform default charset.
            return new String(decoded, UTF_8);
        }
        return root.getStringValue();
    }

    /** Serializes the whole result set as one {@code sparql} document. */
    private XdmNode buildSparqlResults(ResultSet results) {
        TreeWriter tree = new TreeWriter(runtime);
        tree.startDocument(step.getNode().getBaseURI());
        tree.addStartElement(s_sparql);
        tree.startContent();

        tree.addStartElement(s_head);
        tree.startContent();
        for (String var : results.getResultVars()) {
            tree.addStartElement(s_variable);
            tree.addAttribute(_name, var);
            tree.startContent();
            tree.addEndElement();
        }
        tree.addEndElement(); // head

        tree.addStartElement(s_results);
        tree.startContent();
        while (results.hasNext()) {
            writeSparqlSolution(tree, results.next());
        }
        tree.addEndElement(); // results

        tree.addEndElement(); // sparql
        tree.endDocument();
        return tree.getResult();
    }

    /** Writes one {@code result} element with a {@code binding} child per variable name. */
    private void writeSparqlSolution(TreeWriter tree, QuerySolution soln) {
        tree.addStartElement(s_result);
        tree.startContent();

        Iterator<String> names = soln.varNames();
        while (names.hasNext()) {
            String var = names.next();
            tree.addStartElement(s_binding);
            tree.addAttribute(_name, var);
            tree.startContent();
            writeSparqlTerm(tree, soln.get(var));
            tree.addEndElement();
        }

        tree.addEndElement();
    }

    /**
     * Writes a bound value as a {@code literal}, {@code bnode} or {@code uri} element.
     *
     * @throws XProcException if the node is neither a literal nor a resource
     */
    private void writeSparqlTerm(TreeWriter tree, RDFNode node) {
        if (node.isLiteral()) {
            Literal lit = node.asLiteral();
            String lang = lit.getLanguage();

            tree.addStartElement(s_literal);
            if (lang == null || "".equals(lang)) {
                // Only literals without a language tag get a datatype attribute.
                String dt = lit.getDatatypeURI();
                if (dt != null && !"".equals(dt)) {
                    tree.addAttribute(_datatype, dt);
                }
            } else {
                tree.addAttribute(XProcConstants.xml_lang, lang);
            }
            // Close the start tag before writing text, as the other branches do.
            tree.startContent();
            // The language and datatype are carried by the attributes above, so the element
            // text is just the lexical form rather than the literal's toString() rendering.
            tree.addText(lit.getLexicalForm());
            tree.addEndElement();
        } else if (node.isResource()) {
            Resource rsrc = node.asResource();
            String value = rsrc.toString();
            // Resources under this URI prefix are reported as blank nodes.
            boolean blank = value.startsWith("http://marklogic.com/semantics/blank/");

            tree.addStartElement(blank ? s_bnode : s_uri);
            tree.startContent();
            tree.addText(value);
            tree.addEndElement();
        } else {
            throw new XProcException("Unexpected node type in sparql results");
        }
    }

    /**
     * Wraps the runtime's underlying URI resolver in a {@link StepResolver} so that requests
     * for this step's library URI are answered from a class resource.
     *
     * @param runtime the runtime whose resolver is wrapped
     */
    public static void configureStep(XProcRuntime runtime) {
        XProcURIResolver resolver = runtime.getResolver();
        URIResolver uriResolver = resolver.getUnderlyingURIResolver();
        URIResolver myResolver = new StepResolver(uriResolver);
        resolver.setUnderlyingURIResolver(myResolver);
    }

    /**
     * Resolver that serves the {@code library_url} class resource when the resolved URI equals
     * {@code library_xpl}, and otherwise delegates to the resolver it wraps.
     */
    private static class StepResolver implements URIResolver {
        private static final Logger logger = LoggerFactory.getLogger(Sparql.class);

        /** Resolver consulted when this one does not handle the request; may be null. */
        private final URIResolver nextResolver;

        public StepResolver(URIResolver next) {
            nextResolver = next;
        }

        /**
         * Resolves {@code href} against {@code base}.
         *
         * @param href the reference to resolve
         * @param base the base URI, or null to treat {@code href} as the full URI
         * @return a source for the library resource, the delegate's answer, or null when
         *         there is no delegate
         * @throws TransformerException if the delegate resolver throws it
         */
        @Override
        public Source resolve(String href, String base) throws TransformerException {
            if (href != null) {
                try {
                    URI xpl = (base == null) ? new URI(href) : new URI(base).resolve(href);
                    if (library_xpl.equals(xpl.toASCIIString())) {
                        URL url = Sparql.class.getResource(library_url);
                        logger.debug("Reading library.xpl for cx:sparql from {}", url);
                        InputStream s = Sparql.class.getResourceAsStream(library_url);
                        if (s != null) {
                            return new SAXSource(new InputSource(s));
                        }
                        logger.info("Failed to read {} for cx:sparql", library_url);
                    }
                } catch (URISyntaxException ignored) {
                    // Not a URI this resolver can interpret; let the next resolver try.
                } catch (IllegalArgumentException ignored) {
                    // URI.resolve(String) rejects malformed hrefs this way; same fallback.
                }
            }

            if (nextResolver != null) {
                return nextResolver.resolve(href, base);
            }
            return null;
        }
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy