All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.eclipse.rdf4j.rio.turtle.TurtleWriter Maven / Gradle / Ivy

/*******************************************************************************
 * Copyright (c) 2015 Eclipse RDF4J contributors, Aduna, and others.
 *
 * All rights reserved. This program and the accompanying materials
 * are made available under the terms of the Eclipse Distribution License v1.0
 * which accompanies this distribution, and is available at
 * http://www.eclipse.org/org/documents/edl-v10.php.
 *
 * SPDX-License-Identifier: BSD-3-Clause
 *******************************************************************************/
package org.eclipse.rdf4j.rio.turtle;

import java.io.BufferedWriter;
import java.io.IOException;
import java.io.OutputStream;
import java.io.OutputStreamWriter;
import java.io.Writer;
import java.nio.charset.StandardCharsets;
import java.util.ArrayDeque;
import java.util.Collection;
import java.util.Deque;
import java.util.HashSet;
import java.util.Map;
import java.util.Objects;
import java.util.Optional;
import java.util.Set;
import java.util.StringTokenizer;

import org.eclipse.rdf4j.common.io.CharSink;
import org.eclipse.rdf4j.common.io.IndentingWriter;
import org.eclipse.rdf4j.common.net.ParsedIRI;
import org.eclipse.rdf4j.common.text.StringUtil;
import org.eclipse.rdf4j.model.BNode;
import org.eclipse.rdf4j.model.IRI;
import org.eclipse.rdf4j.model.Literal;
import org.eclipse.rdf4j.model.Model;
import org.eclipse.rdf4j.model.ModelFactory;
import org.eclipse.rdf4j.model.Resource;
import org.eclipse.rdf4j.model.Statement;
import org.eclipse.rdf4j.model.Triple;
import org.eclipse.rdf4j.model.Value;
import org.eclipse.rdf4j.model.datatypes.XMLDatatypeUtil;
import org.eclipse.rdf4j.model.impl.LinkedHashModelFactory;
import org.eclipse.rdf4j.model.impl.SimpleIRI;
import org.eclipse.rdf4j.model.util.Literals;
import org.eclipse.rdf4j.model.util.ModelException;
import org.eclipse.rdf4j.model.util.Models;
import org.eclipse.rdf4j.model.util.RDFCollections;
import org.eclipse.rdf4j.model.vocabulary.RDF;
import org.eclipse.rdf4j.model.vocabulary.XSD;
import org.eclipse.rdf4j.rio.RDFFormat;
import org.eclipse.rdf4j.rio.RDFHandlerException;
import org.eclipse.rdf4j.rio.RioSetting;
import org.eclipse.rdf4j.rio.helpers.AbstractRDFWriter;
import org.eclipse.rdf4j.rio.helpers.BasicParserSettings;
import org.eclipse.rdf4j.rio.helpers.BasicWriterSettings;

/**
 * An implementation of the RDFWriter interface that writes RDF documents in Turtle format. The Turtle format is defined
 * in in this document.
 */
public class TurtleWriter extends AbstractRDFWriter implements CharSink {

	private static final int LINE_WRAP = 80;

	private static final long DEFAULT_BUFFER_SIZE = 1000l;

	private static final IRI FIRST = new SimpleIRI(RDF.FIRST.stringValue()) {
		private static final long serialVersionUID = -7951518099940758898L;
	};

	private static final IRI REST = new SimpleIRI(RDF.REST.stringValue()) {
		private static final long serialVersionUID = -7951518099940758898L;
	};

	/**
	 * Size of statement buffer used for pretty printing and blank node inlining. Set to Long.MAX_VALUE to buffer
	 * everything until the end (necessary when blank node inlining).
	 */
	private long bufferSize = DEFAULT_BUFFER_SIZE;
	protected Model bufferedStatements;
	private final Object bufferLock = new Object();

	protected ParsedIRI baseIRI;
	protected IndentingWriter writer;

	/**
	 * Flag indicating whether the last written statement has been closed.
	 */
	protected boolean statementClosed = true;
	protected Resource lastWrittenSubject;
	protected IRI lastWrittenPredicate;

	private final Deque stack = new ArrayDeque<>();
	private final Deque path = new ArrayDeque<>();

	private Boolean xsdStringToPlainLiteral;
	private Boolean prettyPrint;
	private boolean inlineBNodes;
	private Boolean abbreviateNumbers;

	private ModelFactory modelFactory = new LinkedHashModelFactory();

	/**
	 * Creates a new TurtleWriter that will write to the supplied OutputStream.
	 *
	 * @param out The OutputStream to write the Turtle document to.
	 */
	public TurtleWriter(OutputStream out) {
		this(out, null);
	}

	/**
	 * Creates a new TurtleWriter that will write to the supplied OutputStream.
	 *
	 * @param out     The OutputStream to write the Turtle document to.
	 * @param baseIRI
	 */
	public TurtleWriter(OutputStream out, ParsedIRI baseIRI) {
		this.baseIRI = baseIRI;
		// The BufferedWriter is here to avoid to many calls to the CharEncoder
		// see javadoc of OutputStreamWriter.
		this.writer = new IndentingWriter(new BufferedWriter(new OutputStreamWriter(out, StandardCharsets.UTF_8)));
	}

	/**
	 * Creates a new TurtleWriter that will write to the supplied Writer.
	 *
	 * @param writer The Writer to write the Turtle document to.
	 */
	public TurtleWriter(Writer writer) {
		this(writer, null);
	}

	/**
	 * Creates a new TurtleWriter that will write to the supplied Writer.
	 *
	 * @param writer  The Writer to write the Turtle document to.
	 * @param baseIRI
	 */
	public TurtleWriter(Writer writer, ParsedIRI baseIRI) {
		this.baseIRI = baseIRI;
		this.writer = new IndentingWriter(writer);
	}

	@Override
	public Writer getWriter() {
		return writer;
	}

	@Override
	public RDFFormat getRDFFormat() {
		return RDFFormat.TURTLE;
	}

	@Override
	public Collection> getSupportedSettings() {
		final Collection> settings = new HashSet<>(super.getSupportedSettings());
		settings.add(BasicWriterSettings.BASE_DIRECTIVE);
		settings.add(BasicWriterSettings.XSD_STRING_TO_PLAIN_LITERAL);
		settings.add(BasicWriterSettings.PRETTY_PRINT);
		settings.add(BasicWriterSettings.INLINE_BLANK_NODES);
		settings.add(TurtleWriterSettings.ABBREVIATE_NUMBERS);
		return settings;
	}

	@Override
	public void startRDF() throws RDFHandlerException {
		super.startRDF();

		try {
			xsdStringToPlainLiteral = getWriterConfig().get(BasicWriterSettings.XSD_STRING_TO_PLAIN_LITERAL);
			prettyPrint = getWriterConfig().get(BasicWriterSettings.PRETTY_PRINT);
			inlineBNodes = getWriterConfig().get(BasicWriterSettings.INLINE_BLANK_NODES);
			abbreviateNumbers = getWriterConfig().get(TurtleWriterSettings.ABBREVIATE_NUMBERS);

			if (isBuffering()) {
				this.bufferedStatements = getModelFactory().createEmptyModel();
				this.bufferSize = inlineBNodes ? Long.MAX_VALUE : DEFAULT_BUFFER_SIZE;
			}

			if (prettyPrint) {
				writer.setIndentationString("  ");
			} else {
				writer.setIndentationString("");
			}
			if (baseIRI != null && getWriterConfig().get(BasicWriterSettings.BASE_DIRECTIVE)) {
				writeBase(baseIRI.toString());
			}

			// Write namespace declarations
			for (Map.Entry entry : namespaceTable.entrySet()) {
				String name = entry.getKey();
				String prefix = entry.getValue();

				writeNamespace(prefix, name);
			}

			if (!namespaceTable.isEmpty()) {
				writer.writeEOL();
			}
		} catch (IOException e) {
			throw new RDFHandlerException(e);
		}
	}

	@Override
	public void endRDF() throws RDFHandlerException {
		checkWritingStarted();
		synchronized (bufferLock) {
			processBuffer();
		}
		try {
			closePreviousStatement();
			writer.flush();
		} catch (IOException e) {
			throw new RDFHandlerException(e);
		}
	}

	@Override
	public void handleNamespace(String prefix, String name) throws RDFHandlerException {
		checkWritingStarted();
		try {
			if (!namespaceTable.containsKey(name)) {
				// Namespace not yet mapped to a prefix, try to give it the
				// specified prefix

				boolean isLegalPrefix = prefix.isEmpty() || TurtleUtil.isPN_PREFIX(prefix);

				if (!isLegalPrefix || namespaceTable.containsValue(prefix)) {
					// Specified prefix is not legal or the prefix is already in
					// use,
					// generate a legal unique prefix

					if (prefix.isEmpty() || !isLegalPrefix) {
						prefix = "ns";
					}

					int number = 1;

					while (namespaceTable.containsValue(prefix + number)) {
						number++;
					}

					prefix += number;
				}

				namespaceTable.put(name, prefix);

				closePreviousStatement();

				writeNamespace(prefix, name);
			}
		} catch (IOException e) {
			throw new RDFHandlerException(e);
		}
	}

	/**
	 * Set a {@link ModelFactory} to use for creating internal Models for statement processing/buffering purposes.
	 *
	 * @param modelFactory a {@link ModelFactory} to use for internal buffering / statement processing purposes. May not
	 *                     be null.
	 */
	public void setModelFactory(ModelFactory modelFactory) {
		this.modelFactory = Objects.requireNonNull(modelFactory);
	}

	protected ModelFactory getModelFactory() {
		return modelFactory;
	}

	@Override
	protected void consumeStatement(Statement st) throws RDFHandlerException {
		if (isBuffering()) {
			synchronized (bufferLock) {
				bufferedStatements.add(st);
				if (bufferedStatements.size() >= this.bufferSize) {
					processBuffer();
				}
			}
		} else {
			handleStatementInternal(st, false, false, false);
		}
	}

	/**
	 * Internal method that differentiates between the pretty-print and streaming writer cases.
	 *
	 * @param st                     The next statement to write
	 * @param endRDFCalled           True if endRDF has been called before this method is called. This is used to buffer
	 *                               statements for pretty-printing before dumping them when all statements have been
	 *                               delivered to us.
	 * @param canShortenSubjectBNode True if, in the current context, we may be able to shorten the subject of this
	 *                               statement iff it is an instance of {@link BNode}.
	 * @param canShortenObjectBNode  True if, in the current context, we may be able to shorten the object of this
	 *                               statement iff it is an instance of {@link BNode}.
	 */
	protected void handleStatementInternal(Statement st, boolean endRDFCalled, boolean canShortenSubjectBNode,
			boolean canShortenObjectBNode) {
		Resource subj = st.getSubject();
		IRI pred = st.getPredicate();
		Value obj = st.getObject();

		try {
			if (inlineBNodes) {
				if ((pred.equals(RDF.FIRST) || pred.equals(RDF.REST)) && isWellFormedCollection(subj)) {
					// we only use list shorthand syntax if the collection is considered well-formed
					handleList(st, canShortenObjectBNode);
				} else if (!subj.equals(lastWrittenSubject) && stack.contains(subj)) {
					handleInlineNode(st, canShortenSubjectBNode, canShortenObjectBNode);
				} else {
					writeStatement(subj, pred, obj, st.getContext(), canShortenSubjectBNode, canShortenObjectBNode);
				}
			} else {
				writeStatement(subj, pred, obj, st.getContext(), canShortenSubjectBNode, canShortenObjectBNode);
			}
		} catch (IOException e) {
			throw new RDFHandlerException(e);
		}
	}

	/**
	 * Check that the collection started with the supplied subject node is a well-formed RDF Collection.
	 * 

* It specifically checks that any collection subject blank nodes (the subjects of the rdf:first and rdf:rest * statements) are _not_ reused for any other, unrelated statements, and there are no things like multiple rdf:first * or rdf:rest statements for the same subject. *

* * @return true if the collection is considered well-formed false otherwise. */ private boolean isWellFormedCollection(Resource subj) { try { // first check is if we can process as a collection. This is not enough to establish it's well-formed but a // useful first step. final Model collection = RDFCollections.getCollection(bufferedStatements, subj, getModelFactory().createEmptyModel()); // check that collection subject nodes are not re-used for non-collection purposes for (Resource s : Models.subjectBNodes(collection)) { boolean firstFound = false, restFound = false; for (Statement st : bufferedStatements.getStatements(s, null, null)) { IRI pred = st.getPredicate(); if (pred.equals(RDF.FIRST)) { if (!firstFound) { firstFound = true; } else { // second rdf:first statement on same subject is invalid. return false; } } else if (pred.equals(RDF.REST)) { if (!restFound) { restFound = true; } else { // second rdf:rest statement on same subject is invalid. return false; } } else { // non-list-structure statement connected to collection subject blank node return false; } } } return true; } catch (ModelException e) { // collection util could not process the collection return false; } } protected void writeStatement(Resource subj, IRI pred, Value obj, Resource context, boolean canShortenSubjectBNode, boolean canShortenObjectBNode) throws IOException { closeHangingResource(); if (subj.equals(lastWrittenSubject)) { if (pred.equals(lastWrittenPredicate)) { // Identical subject and predicate writer.write(","); wrapLine(prettyPrint); } else { // Identical subject, new predicate writer.write(";"); writer.writeEOL(); // Write new predicate writer.decreaseIndentation(); writePredicate(pred); writer.increaseIndentation(); wrapLine(true); path.removeLast(); path.addLast(pred); lastWrittenPredicate = pred; } } else { // New subject closePreviousStatement(); stack.addLast(subj); // Write new subject: if (prettyPrint) { writer.writeEOL(); } writeResource(subj, canShortenSubjectBNode); wrapLine(true); writer.increaseIndentation(); lastWrittenSubject = subj; // Write new predicate writePredicate(pred); wrapLine(true); path.addLast(pred); lastWrittenPredicate = pred; statementClosed = false; writer.increaseIndentation(); } writeValue(obj, canShortenObjectBNode); // Don't close the line just yet. Maybe the next // statement has the same subject and/or predicate. } @Override public void handleComment(String comment) throws RDFHandlerException { checkWritingStarted(); try { closePreviousStatement(); if (comment.indexOf('\r') != -1 || comment.indexOf('\n') != -1) { // Comment is not allowed to contain newlines or line feeds. // Split comment in individual lines and write comment lines // for each of them. StringTokenizer st = new StringTokenizer(comment, "\r\n"); while (st.hasMoreTokens()) { writeCommentLine(st.nextToken()); } } else { writeCommentLine(comment); } } catch (IOException e) { throw new RDFHandlerException(e); } } protected void writeCommentLine(String line) throws IOException { writer.write("# "); writer.write(line); writer.writeEOL(); } protected void writeBase(String baseURI) throws IOException { writer.write("@base <"); StringUtil.simpleEscapeIRI(baseURI, writer, false); writer.write("> ."); writer.writeEOL(); } protected void writeNamespace(String prefix, String name) throws IOException { writer.write("@prefix "); writer.write(prefix); writer.write(": <"); StringUtil.simpleEscapeIRI(name, writer, false); writer.write("> ."); writer.writeEOL(); } protected void writePredicate(IRI predicate) throws IOException { if (predicate.equals(RDF.TYPE)) { // Write short-cut for rdf:type writer.write("a"); } else { writeURI(predicate); } } /** * @param val The {@link Value} to write. * @throws IOException * @deprecated Use {@link #writeValue(Value, boolean)} instead. */ @Deprecated protected void writeValue(Value val) throws IOException { writeValue(val, false); } /** * Writes a value, optionally shortening it if it is an {@link IRI} and has a namespace definition that is suitable * for use in this context for shortening or a {@link BNode} that has been confirmed to be able to be shortened in * this context. * * @param val The {@link Value} to write. * @param canShorten True if, in the current context, we can shorten this value if it is an instance of * {@link BNode} . * @throws IOException */ protected void writeValue(Value val, boolean canShorten) throws IOException { if (val instanceof BNode && canShorten && !val.equals(stack.peekLast()) && !val.equals(lastWrittenSubject)) { stack.addLast((BNode) val); } else if (val instanceof Resource) { writeResource((Resource) val, canShorten); } else { writeLiteral((Literal) val); } } /** * @param res The {@link Resource} to write. * @throws IOException * @deprecated Use {@link #writeResource(Resource, boolean)} instead. */ @Deprecated protected void writeResource(Resource res) throws IOException { writeResource(res, false); } /** * Writes a {@link Resource}, optionally shortening it if it is an {@link IRI} and has a namespace definition that * is suitable for use in this context for shortening or a {@link BNode} that has been confirmed to be able to be * shortened in this context. * * @param res The {@link Resource} to write. * @param canShorten True if, in the current context, we can shorten this value if it is an instance of * {@link BNode} . * @throws IOException */ protected void writeResource(Resource res, boolean canShorten) throws IOException { if (res instanceof IRI) { writeURI((IRI) res); } else if (res instanceof BNode) { writeBNode((BNode) res, canShorten); } else { writeTriple((Triple) res, canShorten); } } protected void writeURI(IRI uri) throws IOException { String prefix = null; if (TurtleUtil.isValidPrefixedName(uri.getLocalName())) { prefix = namespaceTable.get(uri.getNamespace()); if (prefix != null) { // Namespace is mapped to a prefix; write abbreviated URI writer.write(prefix); writer.write(":"); writer.write(uri.getLocalName()); return; } } // Try to find a prefix for the URI's namespace String uriString = uri.toString(); int splitIdx = TurtleUtil.findURISplitIndex(uriString); if (splitIdx > 0) { String namespace = uriString.substring(0, splitIdx); prefix = namespaceTable.get(namespace); } if (prefix != null) { // Namespace is mapped to a prefix; write abbreviated URI writer.write(prefix); writer.write(":"); writer.write(uriString.substring(splitIdx)); } else if (baseIRI != null) { // Write relative URI writer.write("<"); StringUtil.simpleEscapeIRI(baseIRI.relativize(uriString), writer, false); writer.write(">"); } else { // Write full URI writer.write("<"); StringUtil.simpleEscapeIRI(uriString, writer, false); writer.write(">"); } } /** * @param bNode The {@link BNode} to write. * @throws IOException * @deprecated Use {@link #writeBNode(BNode, boolean)} instead. */ @Deprecated protected void writeBNode(BNode bNode) throws IOException { writeBNode(bNode, false); } protected void writeBNode(BNode bNode, boolean canShorten) throws IOException { if (canShorten) { writer.write("[]"); return; } writer.write("_:"); String id = bNode.getID(); if (id.isEmpty()) { if (this.getWriterConfig().get(BasicParserSettings.PRESERVE_BNODE_IDS)) { throw new IOException("Cannot consistently write blank nodes with empty internal identifiers"); } writer.write("genid-hash-"); writer.write(Integer.toHexString(System.identityHashCode(bNode))); } else { if (!TurtleUtil.isNameStartChar(id.charAt(0))) { writer.write("genid-start-"); writer.write(Integer.toHexString(id.charAt(0))); } else { writer.write(id.charAt(0)); } for (int i = 1; i < id.length() - 1; i++) { if (TurtleUtil.isPN_CHARS(id.charAt(i))) { writer.write(id.charAt(i)); } else { writer.write(Integer.toHexString(id.charAt(i))); } } if (id.length() > 1) { if (!TurtleUtil.isNameEndChar(id.charAt(id.length() - 1))) { writer.write(Integer.toHexString(id.charAt(id.length() - 1))); } else { writer.write(id.charAt(id.length() - 1)); } } } } protected void writeTriple(Triple triple, boolean canShorten) throws IOException { throw new IOException(getRDFFormat().getName() + " does not support RDF-star triples"); } protected void writeTripleRDFStar(Triple triple, boolean canShorten) throws IOException { writer.write("<<"); writeResource(triple.getSubject()); writer.write(" "); writeURI(triple.getPredicate()); writer.write(" "); Value object = triple.getObject(); if (object instanceof Literal) { writeLiteral((Literal) object); } else { writeResource((Resource) object, canShorten); } writer.write(">>"); } protected void writeLiteral(Literal lit) throws IOException { String label = lit.getLabel(); IRI datatype = lit.getDatatype(); if (prettyPrint && abbreviateNumbers) { if (XSD.INTEGER.equals(datatype) || XSD.DECIMAL.equals(datatype) || XSD.DOUBLE.equals(datatype) || XSD.BOOLEAN.equals(datatype)) { try { String normalized = XMLDatatypeUtil.normalize(label, datatype); if (!normalized.equals(XMLDatatypeUtil.POSITIVE_INFINITY) && !normalized.equals(XMLDatatypeUtil.NEGATIVE_INFINITY) && !normalized.equals(XMLDatatypeUtil.NaN)) { writer.write(normalized); return; // done } } catch (IllegalArgumentException e) { // not a valid numeric typed literal. ignore error and write // as // quoted string instead. } } } if (label.indexOf('\n') != -1 || label.indexOf('\r') != -1 || label.indexOf('\t') != -1) { // Write label as long string writer.write("\"\"\""); writer.write(TurtleUtil.encodeLongString(label)); writer.write("\"\"\""); } else { // Write label as normal string writer.write("\""); writer.write(TurtleUtil.encodeString(label)); writer.write("\""); } if (Literals.isLanguageLiteral(lit)) { // Append the literal's language writer.write("@"); writer.write(lit.getLanguage().get()); } else if (!xsdStringToPlainLiteral || !XSD.STRING.equals(datatype)) { // Append the literal's datatype (possibly written as an abbreviated // URI) writer.write("^^"); writeURI(datatype); } } protected void closePreviousStatement() throws IOException { closeNestedResources(null); if (!statementClosed) { // The previous statement still needs to be closed: writer.write(" ."); writer.writeEOL(); writer.decreaseIndentation(); writer.decreaseIndentation(); stack.pollLast(); path.pollLast(); assert stack.isEmpty(); assert path.isEmpty(); statementClosed = true; lastWrittenSubject = null; lastWrittenPredicate = null; } } private boolean isHanging() { return !stack.isEmpty() && lastWrittenSubject != null && !lastWrittenSubject.equals(stack.peekLast()); } private void closeHangingResource() throws IOException { if (isHanging()) { Value val = stack.pollLast(); if (val instanceof Resource) { writeResource((Resource) val, inlineBNodes); } else { writeLiteral((Literal) val); } assert lastWrittenSubject.equals(stack.peekLast()); } } private void closeNestedResources(Resource subj) throws IOException { closeHangingResource(); while (stack.size() > 1 && !stack.peekLast().equals(subj)) { if (prettyPrint) { writer.writeEOL(); } writer.decreaseIndentation(); writer.decreaseIndentation(); writer.write("]"); stack.pollLast(); path.pollLast(); lastWrittenSubject = stack.peekLast(); lastWrittenPredicate = path.peekLast(); } } private void handleInlineNode(Statement st, boolean inlineSubject, boolean inlineObject) throws IOException { Resource subj = st.getSubject(); IRI pred = st.getPredicate(); if (isHanging() && subj.equals(stack.peekLast())) { // blank subject lastWrittenSubject = subj; writer.write("["); if (prettyPrint && !RDF.TYPE.equals(pred)) { writer.writeEOL(); } else { wrapLine(prettyPrint); } writer.increaseIndentation(); // Write new predicate writePredicate(pred); writer.increaseIndentation(); wrapLine(true); path.addLast(pred); lastWrittenPredicate = pred; writeValue(st.getObject(), inlineObject); } else if (!subj.equals(lastWrittenSubject) && stack.contains(subj)) { closeNestedResources(subj); writeStatement(subj, pred, st.getObject(), st.getContext(), inlineSubject, inlineObject); } else { assert false; } } private void handleList(Statement st, boolean canInlineObjectBNode) throws IOException { Resource subj = st.getSubject(); boolean first = RDF.FIRST.equals(st.getPredicate()); boolean rest = RDF.REST.equals(st.getPredicate()) && !RDF.NIL.equals(st.getObject()); boolean nil = RDF.REST.equals(st.getPredicate()) && RDF.NIL.equals(st.getObject()); if (first && REST != lastWrittenPredicate && isHanging()) { // new collection writer.write("("); writer.increaseIndentation(); wrapLine(false); lastWrittenSubject = subj; path.addLast(FIRST); lastWrittenPredicate = FIRST; writeValue(st.getObject(), canInlineObjectBNode); } else if (first && REST == lastWrittenPredicate) { // item in existing collection lastWrittenSubject = subj; path.addLast(FIRST); lastWrittenPredicate = FIRST; writeValue(st.getObject(), canInlineObjectBNode); } else { closeNestedResources(subj); if (rest && FIRST == lastWrittenPredicate) { // next item wrapLine(true); path.removeLast(); // RDF.FIRST path.addLast(REST); lastWrittenPredicate = REST; writeValue(st.getObject(), inlineBNodes); } else if (nil && FIRST == lastWrittenPredicate) { writer.decreaseIndentation(); writer.write(")"); path.removeLast(); // RDF.FIRST path.addLast(REST); while (REST == path.peekLast()) { stack.pollLast(); path.pollLast(); lastWrittenSubject = stack.peekLast(); lastWrittenPredicate = path.peekLast(); } } else { writeStatement(subj, st.getPredicate(), st.getObject(), st.getContext(), inlineBNodes, inlineBNodes); } } } private void wrapLine(boolean space) throws IOException { if (prettyPrint && writer.getCharactersSinceEOL() > LINE_WRAP) { writer.writeEOL(); } else if (space) { writer.write(" "); } } /** * not synchronized, assumes calling method has obtained a lock on {@link #bufferLock}. */ private void processBuffer() throws RDFHandlerException { if (!isBuffering()) { return; } if (this.getRDFFormat().supportsContexts()) { // to allow use in Turtle extensions such a TriG // primary grouping per context. for (Resource context : bufferedStatements.contexts()) { Model contextData = bufferedStatements.filter(null, null, null, context); Set processedSubjects = new HashSet<>(); Optional nextSubject = nextSubject(contextData, processedSubjects); while (nextSubject.isPresent()) { processSubject(contextData, nextSubject.get(), processedSubjects); nextSubject = nextSubject(contextData, processedSubjects); } } } else { // group by subject Set processedSubjects = new HashSet<>(); Optional nextSubject = nextSubject(bufferedStatements, processedSubjects); while (nextSubject.isPresent()) { processSubject(bufferedStatements, nextSubject.get(), processedSubjects); nextSubject = nextSubject(bufferedStatements, processedSubjects); } } bufferedStatements.clear(); } private Optional nextSubject(Model contextData, Set processedSubjects) { // first try finding a subject that has not yet been processed and is not the object of another // unprocessed subject for (Resource subject : contextData.subjects()) { if (processedSubjects.contains(subject)) { continue; } if (subject.isBNode() && inlineBNodes) { Set otherSubjects = contextData.filter(null, null, subject).subjects(); if (otherSubjects.stream().anyMatch(s -> !processedSubjects.contains(s))) { // Other unprocessed subject using this subject as an object is present. Skip this one for now. continue; } } return Optional.of(subject); } // Ensure we did not inadvertently miss any subjects. This can happen when there is a cyclic relation between // blank nodes. return contextData.subjects().stream().filter(subject -> !processedSubjects.contains(subject)).findAny(); } private void processSubject(Model contextData, Resource subject, Set processedSubjects) { if (processedSubjects.contains(subject)) { return; } Set processedPredicates = new HashSet<>(); // give rdf:type preference over other predicates. processPredicate(contextData, subject, RDF.TYPE, processedSubjects, processedPredicates); // handle RDF Collection statements separately, to make sure we process them in the correct order processPredicate(contextData, subject, RDF.FIRST, processedSubjects, processedPredicates); // retrieve other statement from this context with the same // subject, and output them grouped by predicate for (IRI predicate : contextData.filter(subject, null, null).predicates()) { if (!processedPredicates.contains(predicate)) { processPredicate(contextData, subject, predicate, processedSubjects, processedPredicates); } } processedSubjects.add(subject); } private void processPredicate(Model contextData, Resource subject, IRI predicate, Set processedSubjects, Set processedPredicates) { for (Statement st : contextData.getStatements(subject, predicate, null)) { boolean canInlineObject = canInlineValue(contextData, st.getObject()); handleStatementInternal(st, false, canInlineValue(contextData, st.getSubject()), canInlineObject); if (canInlineObject && st.getObject() instanceof BNode) { processSubject(contextData, (BNode) st.getObject(), processedSubjects); } } processedPredicates.add(predicate); } private boolean canInlineValue(Model contextData, Value v) { if (!inlineBNodes) { return false; } if (v instanceof BNode) { return (contextData.filter(null, null, v).size() <= 1); } return true; } /** * Checks if the writer is configured such that it needs statement buffering. * * @return true if the writer is buffering, false otherwise. */ private boolean isBuffering() { return inlineBNodes || prettyPrint; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy