All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.eclipse.rdf4j.rio.RDFFormat Maven / Gradle / Ivy

/*******************************************************************************
 * Copyright (c) 2015 Eclipse RDF4J contributors, Aduna, and others.
 * All rights reserved. This program and the accompanying materials
 * are made available under the terms of the Eclipse Distribution License v1.0
 * which accompanies this distribution, and is available at
 * http://www.eclipse.org/org/documents/edl-v10.php.
 *******************************************************************************/
package org.eclipse.rdf4j.rio;

import java.nio.charset.Charset;
import java.nio.charset.StandardCharsets;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collection;
import java.util.List;

import org.eclipse.rdf4j.common.lang.FileFormat;
import org.eclipse.rdf4j.model.IRI;
import org.eclipse.rdf4j.model.Statement;
import org.eclipse.rdf4j.model.impl.SimpleValueFactory;

/**
 * Represents the concept of an RDF data serialization format. RDF formats are identified by a {@link #getName() name}
 * and can have one or more associated MIME types, zero or more associated file extensions and can specify a (default)
 * character encoding. Some formats are able to encode context information while other are not; this is indicated by the
 * value of {@link #supportsContexts}.
 *
 * @author Arjohn Kampman
 */
public class RDFFormat extends FileFormat {

	/*-----------*
	 * Constants *
	 *-----------*/

	/**
	 * Indicates that calls to {@link RDFHandler#handleNamespace(String, String)} may be serialised when serializing to
	 * this format.
	 */
	public static final boolean SUPPORTS_NAMESPACES = true;

	/**
	 * Indicates that all calls to {@link RDFHandler#handleNamespace(String, String)} will be ignored when serializing
	 * to this format.
	 */
	public static final boolean NO_NAMESPACES = false;

	/**
	 * Indicates that the {@link Statement#getContext()} URI may be serialized for this format.
	 */
	public static final boolean SUPPORTS_CONTEXTS = true;

	/**
	 * Indicates that the {@link Statement#getContext()} URI will NOT be serialized for this format.
	 */
	public static final boolean NO_CONTEXTS = false;

	/**
	 * Indicates that RDF* triples can be serialized natively for this format.
	 */
	public static final boolean SUPPORTS_RDF_STAR = true;

	/**
	 * Indicates that RDF* triples will NOT be serialized natively for this format.
	 */
	public static final boolean NO_RDF_STAR = false;

	/**
	 * The RDF/XML file format.
	 * 

* Several file extensions are accepted for RDF/XML documents, including .rdf, .rdfs (for * RDF Schema files), .owl (for OWL ontologies), and .xml. The media type is * application/rdf+xml, but application/xml and text/xml are also accepted. * The character encoding is UTF-8. *

* * @see RDF/XML Syntax Specification (Revised) */ public static final RDFFormat RDFXML = new RDFFormat("RDF/XML", Arrays.asList("application/rdf+xml", "application/xml", "text/xml"), StandardCharsets.UTF_8, Arrays.asList("rdf", "rdfs", "owl", "xml"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/RDF_XML"), SUPPORTS_NAMESPACES, NO_CONTEXTS, NO_RDF_STAR); /** * The N-Triples file format. *

* The file extension .nt is recommend for N-Triples documents. The media type is * application/n-triples and encoding is in UTF-8. *

* * @see N-Triples */ public static final RDFFormat NTRIPLES = new RDFFormat("N-Triples", Arrays.asList("application/n-triples", "text/plain"), StandardCharsets.UTF_8, Arrays.asList("nt"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/N-Triples"), NO_NAMESPACES, NO_CONTEXTS, NO_RDF_STAR); /** * The Turtle file format. *

* The file extension .ttl is recommend for Turtle documents. The media type is * text/turtle, but application/x-turtle is also accepted. Character encoding is UTF-8. *

* * @see Turtle - Terse RDF Triple Language */ public static final RDFFormat TURTLE = new RDFFormat("Turtle", Arrays.asList("text/turtle", "application/x-turtle"), StandardCharsets.UTF_8, Arrays.asList("ttl"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/Turtle"), SUPPORTS_NAMESPACES, NO_CONTEXTS, NO_RDF_STAR); /** * The Turtle* (TurtleStar) file format, a Turtle-based RDF serialization format that supports RDF* triples. *

* The file extension .ttls is recommended for Turtle* documents. The media type is * application/x-turtlestar and the encoding is UTF-8. *

* * @see Foundations of an Alternative Approach to Reification in * RDF */ public static final RDFFormat TURTLESTAR = new RDFFormat("Turtle*", Arrays.asList("text/x-turtlestar", "application/x-turtlestar"), StandardCharsets.UTF_8, Arrays.asList("ttls"), SUPPORTS_NAMESPACES, NO_CONTEXTS, SUPPORTS_RDF_STAR); /** * The N3/Notation3 file format. *

* The file extension .n3 is recommended for N3 documents. The media type is text/n3, but * text/rdf+n3 is also accepted. Character encoding is UTF-8. *

* * @see Notation3 (N3): A readable RDF syntax */ public static final RDFFormat N3 = new RDFFormat("N3", Arrays.asList("text/n3", "text/rdf+n3"), StandardCharsets.UTF_8, Arrays.asList("n3"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/N3"), SUPPORTS_NAMESPACES, NO_CONTEXTS, NO_RDF_STAR); /** * The TriX file format, an XML-based RDF serialization format that * supports recording of named graphs. *

* The file extension .xml is recommended for TriX documents, .trix is also accepted. The * media type is application/trix and the encoding is UTF-8. *

* * @see TriX: RDF Triples in XML */ public static final RDFFormat TRIX = new RDFFormat("TriX", Arrays.asList("application/trix"), StandardCharsets.UTF_8, Arrays.asList("xml", "trix"), null, SUPPORTS_NAMESPACES, SUPPORTS_CONTEXTS, NO_RDF_STAR); /** * The TriG file format, a Turtle-based RDF serialization format that * supports recording of named graphs. *

* The file extension .trig is recommend for TriG documents. The media type is * application/trig and the encoding is UTF-8. *

* * @see The TriG Syntax */ public static final RDFFormat TRIG = new RDFFormat("TriG", Arrays.asList("application/trig", "application/x-trig"), StandardCharsets.UTF_8, Arrays.asList("trig"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/TriG"), SUPPORTS_NAMESPACES, SUPPORTS_CONTEXTS, NO_RDF_STAR); /** * The TriG* (TriGStar) file format, a TriG-based RDF serialization format that supports RDF* triples. This builds * upon the idea for the Turtle* format but adds support for named graphs. *

* The file extension .trigs is recommended for TriG* documents. The media type is * application/x-trigstar and the encoding is UTF-8. *

* * @see Foundations of an Alternative Approach to Reification in * RDF */ public static final RDFFormat TRIGSTAR = new RDFFormat("TriG*", "application/x-trigstar", StandardCharsets.UTF_8, "trigs", SUPPORTS_NAMESPACES, SUPPORTS_CONTEXTS, SUPPORTS_RDF_STAR); /** * A binary RDF format. *

* The file extension .brf is recommend for binary RDF documents. The media type is * application/x-binary-rdf. *

* * @see Binary RDF in Sesame */ public static final RDFFormat BINARY = new RDFFormat("BinaryRDF", Arrays.asList("application/x-binary-rdf"), null, Arrays.asList("brf"), null, SUPPORTS_NAMESPACES, SUPPORTS_CONTEXTS, SUPPORTS_RDF_STAR); /** * The N-Quads file format, an RDF serialization format that supports * recording of named graphs. *

* The file extension .nq is recommended for N-Quads documents. The media type is * application/n-quads and the encoding is UTF-8. *

* * @see N-Quads: Extending N-Triples with Context */ public static final RDFFormat NQUADS = new RDFFormat("N-Quads", Arrays.asList("application/n-quads", "text/x-nquads", "text/nquads"), StandardCharsets.UTF_8, Arrays.asList("nq"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/N-Quads"), NO_NAMESPACES, SUPPORTS_CONTEXTS, NO_RDF_STAR); /** * The JSON-LD file format, an RDF serialization format that supports * recording of named graphs. *

* The file extension .jsonld is recommended for JSON-LD documents. The media type is * application/ld+json and the encoding is UTF-8. *

* * @see JSON-LD 1.0 */ public static final RDFFormat JSONLD = new RDFFormat("JSON-LD", Arrays.asList("application/ld+json"), StandardCharsets.UTF_8, Arrays.asList("jsonld"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/JSON-LD"), SUPPORTS_NAMESPACES, SUPPORTS_CONTEXTS, NO_RDF_STAR); /** * The RDF/JSON file format, an RDF serialization format that supports * recording of named graphs. *

* The file extension .rj is recommended for RDF/JSON documents. The media type is * application/rdf+json and the encoding is UTF-8. *

* * @see RDF 1.1 JSON Alternate Serialization (RDF/JSON) */ public static final RDFFormat RDFJSON = new RDFFormat("RDF/JSON", Arrays.asList("application/rdf+json"), StandardCharsets.UTF_8, Arrays.asList("rj"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/RDF_JSON"), NO_NAMESPACES, SUPPORTS_CONTEXTS, NO_RDF_STAR); /** * The RDFa file format, an RDF serialization format. *

* The file extension .xhtml is recommended for RDFa documents. The preferred media type is * application/xhtml+xml and the encoding is UTF-8. *

* * @see XHTML+RDFa 1.1 */ public static final RDFFormat RDFA = new RDFFormat("RDFa", Arrays.asList("application/xhtml+xml", "application/html", "text/html"), StandardCharsets.UTF_8, Arrays.asList("xhtml", "html"), SimpleValueFactory.getInstance().createIRI("http://www.w3.org/ns/formats/RDFa"), SUPPORTS_NAMESPACES, NO_CONTEXTS, NO_RDF_STAR); /** * The HDT file format, an RDF serialization format. *

* The file extension .hdt is recommended for HDT documents. *

* * @see HDT v1.0 */ public static final RDFFormat HDT = new RDFFormat("HDT", Arrays.asList("application/vnd.hdt"), null, Arrays.asList("hdt"), null, SUPPORTS_NAMESPACES, NO_CONTEXTS, NO_RDF_STAR); /*----------------* * Static methods * *----------------*/ /** * Processes the supplied collection of {@link RDFFormat}s and assigns quality values to each based on whether * context must be supported and whether the format is preferred. * * @param rdfFormats The {@link RDFFormat}s to process. * @param requireContext True to decrease the quality value for formats where {@link RDFFormat#supportsContexts()} * returns false. * @param preferredFormat The preferred RDFFormat. If it is not in the list then the quality of all formats will be * processed as if they are not preferred. * @return A list of strings containing the content types and an attached q-value specifying the quality for the * format for each type. */ public static List getAcceptParams(Iterable rdfFormats, boolean requireContext, RDFFormat preferredFormat) { List acceptParams = new ArrayList<>(); for (RDFFormat format : rdfFormats) { // Determine a q-value that reflects the necessity of context // support and the user specified preference int qValue = 10; if (requireContext && !format.supportsContexts()) { // Prefer context-supporting formats over pure triple-formats qValue -= 5; } if (preferredFormat != null && !preferredFormat.equals(format)) { // Prefer specified format over other formats qValue -= 2; } if (!format.supportsNamespaces()) { // We like reusing namespace prefixes qValue -= 1; } if (RDFXML.equals(format)) { // We explicitly dislike RDF/XML as it has limitations in what it can serialize. See #299. qValue -= 4; } // ensure q-value does not go below 0.1. qValue = Math.max(1, qValue); for (String mimeType : format.getMIMETypes()) { String acceptParam = mimeType; if (qValue < 10) { acceptParam += ";q=0." + qValue; } acceptParams.add(acceptParam); } } return acceptParams; } /*-----------* * Variables * *-----------*/ /** * Flag indicating whether the RDFFormat can encode namespace information. */ private final boolean supportsNamespaces; /** * Flag indicating whether the RDFFormat can encode context information. */ private final boolean supportsContexts; /** * Flag indicating whether the RDFFormat can encode RDF* triples natively. */ private final boolean supportsRDFStar; /** * A standard URI published by the W3C or another standards body to uniquely denote this format. * * @see Unique URIs for File Formats */ private IRI standardURI; /*--------------* * Constructors * *--------------*/ /** * Creates a new RDFFormat object. * * @param name The name of the RDF file format, e.g. "RDF/XML". * @param mimeType The MIME type of the RDF file format, e.g. application/rdf+xml for the RDF/XML * file format. * @param charset The default character encoding of the RDF file format. Specify null if not * applicable. * @param fileExtension The (default) file extension for the RDF file format, e.g. rdf for RDF/XML * files. * @param supportsNamespaces True if the RDFFormat supports the encoding of namespace/prefix information * and false otherwise. * @param supportsContexts True if the RDFFormat supports the encoding of contexts/named graphs and * false otherwise. * @deprecated since 3.2.0 */ @Deprecated public RDFFormat(String name, String mimeType, Charset charset, String fileExtension, boolean supportsNamespaces, boolean supportsContexts) { this(name, mimeType, charset, fileExtension, supportsNamespaces, supportsContexts, NO_RDF_STAR); } /** * Creates a new RDFFormat object. * * @param name The name of the RDF file format, e.g. "RDF/XML". * @param mimeType The MIME type of the RDF file format, e.g. application/rdf+xml for the RDF/XML * file format. * @param charset The default character encoding of the RDF file format. Specify null if not * applicable. * @param fileExtension The (default) file extension for the RDF file format, e.g. rdf for RDF/XML * files. * @param supportsNamespaces True if the RDFFormat supports the encoding of namespace/prefix information * and false otherwise. * @param supportsContexts True if the RDFFormat supports the encoding of contexts/named graphs and * false otherwise. * @param supportsRDFStar True if the RDFFormat supports the encoding of RDF* triples natively and * false otherwise. */ public RDFFormat(String name, String mimeType, Charset charset, String fileExtension, boolean supportsNamespaces, boolean supportsContexts, boolean supportsRDFStar) { this(name, Arrays.asList(mimeType), charset, Arrays.asList(fileExtension), supportsNamespaces, supportsContexts, supportsRDFStar); } /** * Creates a new RDFFormat object. * * @param name The name of the RDF file format, e.g. "RDF/XML". * @param mimeType The MIME type of the RDF file format, e.g. application/rdf+xml for the RDF/XML * file format. * @param charset The default character encoding of the RDF file format. Specify null if not * applicable. * @param fileExtensions The RDF format's file extensions, e.g. rdf for RDF/XML files. The first item * in the list is interpreted as the default file extension for the format. * @param supportsNamespaces True if the RDFFormat supports the encoding of namespace/prefix information * and false otherwise. * @param supportsContexts True if the RDFFormat supports the encoding of contexts/named graphs and * false otherwise. * @deprecated since 3.2.0 */ @Deprecated public RDFFormat(String name, String mimeType, Charset charset, Collection fileExtensions, boolean supportsNamespaces, boolean supportsContexts) { this(name, mimeType, charset, fileExtensions, supportsNamespaces, supportsContexts, NO_RDF_STAR); } /** * Creates a new RDFFormat object. * * @param name The name of the RDF file format, e.g. "RDF/XML". * @param mimeType The MIME type of the RDF file format, e.g. application/rdf+xml for the RDF/XML * file format. * @param charset The default character encoding of the RDF file format. Specify null if not * applicable. * @param fileExtensions The RDF format's file extensions, e.g. rdf for RDF/XML files. The first item * in the list is interpreted as the default file extension for the format. * @param supportsNamespaces True if the RDFFormat supports the encoding of namespace/prefix information * and false otherwise. * @param supportsContexts True if the RDFFormat supports the encoding of contexts/named graphs and * false otherwise. * @param supportsRDFStar True if the RDFFormat supports the encoding of RDF* triples natively and * false otherwise. */ public RDFFormat(String name, String mimeType, Charset charset, Collection fileExtensions, boolean supportsNamespaces, boolean supportsContexts, boolean supportsRDFStar) { this(name, Arrays.asList(mimeType), charset, fileExtensions, supportsNamespaces, supportsContexts, supportsRDFStar); } /** * Creates a new RDFFormat object. * * @param name The name of the RDF file format, e.g. "RDF/XML". * @param mimeTypes The MIME types of the RDF file format, e.g. application/rdf+xml for the * RDF/XML file format. The first item in the list is interpreted as the default MIME type * for the format. * @param charset The default character encoding of the RDF file format. Specify null if not * applicable. * @param fileExtensions The RDF format's file extensions, e.g. rdf for RDF/XML files. The first item * in the list is interpreted as the default file extension for the format. * @param supportsNamespaces True if the RDFFormat supports the encoding of namespace/prefix information * and false otherwise. * @param supportsContexts True if the RDFFormat supports the encoding of contexts/named graphs and * false otherwise. * @deprecated since 3.2.0 */ @Deprecated public RDFFormat(String name, Collection mimeTypes, Charset charset, Collection fileExtensions, boolean supportsNamespaces, boolean supportsContexts) { this(name, mimeTypes, charset, fileExtensions, null, supportsNamespaces, supportsContexts, NO_RDF_STAR); } /** * Creates a new RDFFormat object. * * @param name The name of the RDF file format, e.g. "RDF/XML". * @param mimeTypes The MIME types of the RDF file format, e.g. application/rdf+xml for the * RDF/XML file format. The first item in the list is interpreted as the default MIME type * for the format. * @param charset The default character encoding of the RDF file format. Specify null if not * applicable. * @param fileExtensions The RDF format's file extensions, e.g. rdf for RDF/XML files. The first item * in the list is interpreted as the default file extension for the format. * @param supportsNamespaces True if the RDFFormat supports the encoding of namespace/prefix information * and false otherwise. * @param supportsContexts True if the RDFFormat supports the encoding of contexts/named graphs and * false otherwise. * @param supportsRDFStar True if the RDFFormat supports the encoding of RDF* triples natively and * false otherwise. */ public RDFFormat(String name, Collection mimeTypes, Charset charset, Collection fileExtensions, boolean supportsNamespaces, boolean supportsContexts, boolean supportsRDFStar) { this(name, mimeTypes, charset, fileExtensions, null, supportsNamespaces, supportsContexts, supportsRDFStar); } /** * Creates a new RDFFormat object. * * @param name The name of the RDF file format, e.g. "RDF/XML". * @param mimeTypes The MIME types of the RDF file format, e.g. application/rdf+xml for the * RDF/XML file format. The first item in the list is interpreted as the default MIME type * for the format. * @param charset The default character encoding of the RDF file format. Specify null if not * applicable. * @param fileExtensions The RDF format's file extensions, e.g. rdf for RDF/XML files. The first item * in the list is interpreted as the default file extension for the format. * @param standardURI The standard URI that has been assigned to this format by a standards organisation or * null if it does not currently have a standard URI. * @param supportsNamespaces True if the RDFFormat supports the encoding of namespace/prefix information * and false otherwise. * @param supportsContexts True if the RDFFormat supports the encoding of contexts/named graphs and * false otherwise. * @deprecated since 3.2.0 */ @Deprecated public RDFFormat(String name, Collection mimeTypes, Charset charset, Collection fileExtensions, IRI standardURI, boolean supportsNamespaces, boolean supportsContexts) { this(name, mimeTypes, charset, fileExtensions, standardURI, supportsNamespaces, supportsContexts, NO_RDF_STAR); } /** * Creates a new RDFFormat object. * * @param name The name of the RDF file format, e.g. "RDF/XML". * @param mimeTypes The MIME types of the RDF file format, e.g. application/rdf+xml for the * RDF/XML file format. The first item in the list is interpreted as the default MIME type * for the format. * @param charset The default character encoding of the RDF file format. Specify null if not * applicable. * @param fileExtensions The RDF format's file extensions, e.g. rdf for RDF/XML files. The first item * in the list is interpreted as the default file extension for the format. * @param standardURI The standard URI that has been assigned to this format by a standards organisation or * null if it does not currently have a standard URI. * @param supportsNamespaces True if the RDFFormat supports the encoding of namespace/prefix information * and false otherwise. * @param supportsContexts True if the RDFFormat supports the encoding of contexts/named graphs and * false otherwise. * @param supportsRDFStar True if the RDFFormat supports the encoding of RDF* triples natively and * false otherwise. */ public RDFFormat(String name, Collection mimeTypes, Charset charset, Collection fileExtensions, IRI standardURI, boolean supportsNamespaces, boolean supportsContexts, boolean supportsRDFStar) { super(name, mimeTypes, charset, fileExtensions); this.standardURI = standardURI; this.supportsNamespaces = supportsNamespaces; this.supportsContexts = supportsContexts; this.supportsRDFStar = supportsRDFStar; } /*---------* * Methods * *---------*/ /** * Return true if the RDFFormat supports the encoding of namespace/prefix information. */ public boolean supportsNamespaces() { return supportsNamespaces; } /** * Return true if the RDFFormat supports the encoding of contexts/named graphs. */ public boolean supportsContexts() { return supportsContexts; } /** * Return true if the RDFFormat supports the encoding of RDF* triples natively. */ public boolean supportsRDFStar() { return supportsRDFStar; } /** * @return True if a standard URI has been assigned to this format by a standards organisation. */ public boolean hasStandardURI() { return standardURI != null; } /** * @return The standard URI that has been assigned to this format by a standards organisation or null if it does not * currently have a standard URI. */ public IRI getStandardURI() { return standardURI; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy