All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.eclipse.rdf4j.rio.ndjsonld.legacy.NDJSONLDParser Maven / Gradle / Ivy

There is a newer version: 5.1.0
Show newest version
/*******************************************************************************
 * Copyright (c) 2024 Eclipse RDF4J contributors.
 *
 * All rights reserved. This program and the accompanying materials
 * are made available under the terms of the Eclipse Distribution License v1.0
 * which accompanies this distribution, and is available at
 * http://www.eclipse.org/org/documents/edl-v10.php.
 *
 * SPDX-License-Identifier: BSD-3-Clause
 ******************************************************************************/
package org.eclipse.rdf4j.rio.ndjsonld.legacy;

import java.io.BufferedReader;
import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.Reader;
import java.nio.charset.StandardCharsets;
import java.util.LinkedList;
import java.util.List;

import org.apache.commons.io.input.BOMInputStream;
import org.eclipse.rdf4j.model.Value;
import org.eclipse.rdf4j.model.ValueFactory;
import org.eclipse.rdf4j.rio.RDFFormat;
import org.eclipse.rdf4j.rio.RDFHandlerException;
import org.eclipse.rdf4j.rio.RDFParseException;
import org.eclipse.rdf4j.rio.jsonld.legacy.JSONLDParser;

import com.fasterxml.jackson.core.JsonFactory;
import com.fasterxml.jackson.core.JsonParser;
import com.github.jsonldjava.utils.JsonUtils;

/**
 * Introduce a parser capable of parsing Newline Delimited JSON-LD, where each line is a serialized JSON-LD record. The
 * format is inspired by Newline Delimited JSON formathttp://ndjson.org/. Even though each line is a separate
 * JSON-LD document, the whole document is treated as a single RDF document, having one single BNodes context to
 * preserve BNodes identifiers.
 *
 * @author Desislava Hristova
 */
public class NDJSONLDParser extends JSONLDParser {

	/**
	 * Default constructor
	 */
	public NDJSONLDParser() {
		super();
	}

	/**
	 * Creates a RDF4J NDJSONLD Parser using the given {@link ValueFactory} to create new {@link Value}s.
	 *
	 * @param valueFactory The ValueFactory to use
	 */
	public NDJSONLDParser(final ValueFactory valueFactory) {
		super(valueFactory);
	}

	@Override
	public RDFFormat getRDFFormat() {
		return RDFFormat.NDJSONLD;
	}

	@Override
	protected Object getJSONObject(InputStream in, Reader reader, JsonFactory factory) throws IOException {
		List arrayOfJSONLD = new LinkedList<>();
		try (BufferedReader bufferedReader = new BufferedReader(reader)) {
			String line;
			while ((line = bufferedReader.readLine()) != null) {
				if (!line.isEmpty()) {
					JsonParser nextParser = factory
							.createParser(new ByteArrayInputStream(line.getBytes(StandardCharsets.UTF_8)));
					Object singleJSONLD = JsonUtils.fromJsonParser(nextParser);
					if (singleJSONLD instanceof List) {
						arrayOfJSONLD.addAll((List) singleJSONLD);
					} else {
						arrayOfJSONLD.add(singleJSONLD);
					}
				}
			}
			return arrayOfJSONLD;
		}
	}

	@Override
	public void parse(InputStream in, String baseURI) throws RDFParseException, RDFHandlerException, IOException {
		if (in == null) {
			throw new IllegalArgumentException("Input stream must not be 'null'");
		}

		parse(new InputStreamReader(new BOMInputStream(in, false), StandardCharsets.UTF_8), baseURI);
	}
}