com.xmlcalabash.extensions.RDFLoad Maven / Gradle / Ivy
package com.xmlcalabash.extensions;
import com.hp.hpl.jena.graph.Node;
import com.hp.hpl.jena.query.Dataset;
import com.hp.hpl.jena.query.DatasetFactory;
import com.hp.hpl.jena.rdf.model.Literal;
import com.hp.hpl.jena.rdf.model.Model;
import com.hp.hpl.jena.rdf.model.ModelFactory;
import com.hp.hpl.jena.rdf.model.Property;
import com.hp.hpl.jena.rdf.model.RDFNode;
import com.hp.hpl.jena.rdf.model.Resource;
import com.hp.hpl.jena.rdf.model.Statement;
import com.hp.hpl.jena.rdf.model.StmtIterator;
import com.xmlcalabash.core.XProcConstants;
import com.xmlcalabash.core.XProcException;
import com.xmlcalabash.core.XProcRuntime;
import com.xmlcalabash.io.ReadablePipe;
import com.xmlcalabash.io.WritablePipe;
import com.xmlcalabash.library.DefaultStep;
import com.xmlcalabash.runtime.XAtomicStep;
import com.xmlcalabash.util.RelevantNodes;
import com.xmlcalabash.util.S9apiUtils;
import com.xmlcalabash.util.TreeWriter;
import net.sf.saxon.s9api.Axis;
import net.sf.saxon.s9api.QName;
import net.sf.saxon.s9api.SaxonApiException;
import net.sf.saxon.s9api.XdmNode;
import org.apache.jena.riot.Lang;
import org.apache.jena.riot.RDFDataMgr;
import org.apache.jena.riot.RiotReader;
import org.apache.jena.riot.lang.LangRIOT;
import org.apache.jena.riot.system.ErrorHandler;
import org.apache.jena.riot.system.ParserProfile;
import org.apache.jena.riot.system.RiotLib;
import org.apache.jena.riot.system.StreamRDF;
import org.apache.jena.riot.system.StreamRDFLib;
import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URI;
import java.net.URL;
import java.net.URLConnection;
import java.util.Calendar;
import java.util.Iterator;
import java.util.Random;
import java.util.regex.Pattern;
/**
* Created by IntelliJ IDEA.
* User: ndw
* Date: Oct 8, 2008
* Time: 7:44:07 AM
* To change this template use File | Settings | File Templates.
*/
public class RDFLoad extends RDFStep {
/**
* Creates a new instance of Identity
*/
public RDFLoad(XProcRuntime runtime, XAtomicStep step) {
super(runtime,step);
}
public void run() throws SaxonApiException {
super.run();
while (source.moreDocuments()) {
XdmNode doc = source.read();
loadRdf(dataset, doc);
}
String href = getOption(_href).getString();
String graphName = getOption(_graph, (String) null);
Lang lang = getLanguage(href);
if (lang == null) {
throw new XProcException("Could not deduce language for RDFLoad data.");
}
Iterator graphNameIter = null;
StmtIterator statementIter = null;
try {
URI baseURI = step.getNode().getBaseURI();
URL url = baseURI.resolve(href).toURL();
URLConnection conn = url.openConnection();
StreamRDF dest = StreamRDFLib.dataset(dataset.asDatasetGraph());
LangRIOT parser = RiotReader.createParser(conn.getInputStream(), lang, href, dest);
ErrorHandler handler = new ParserErrorHandler(href);
ParserProfile prof = RiotLib.profile(lang, href, handler);
parser.setProfile(prof);
try {
parser.parse();
} catch (Throwable e) {
System.err.println("Parse error in RDFLoad document; processing partial document");
e.printStackTrace();
}
conn.getInputStream().close();
} catch (MalformedURLException e) {
throw new XProcException(e);
} catch (IOException e) {
throw new XProcException(e);
}
if (graphName == null) {
statementIter = dataset.getDefaultModel().listStatements();
dumpStatements(statementIter, null);
graphNameIter = dataset.listNames();
while (graphNameIter.hasNext()) {
String collection = graphNameIter.next();
statementIter = dataset.getNamedModel(collection).listStatements();
dumpStatements(statementIter, collection);
}
} else {
statementIter = dataset.getNamedModel(graphName).listStatements();
dumpStatements(statementIter, graphName);
}
}
}