All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.marklogic.client.example.cookbook.DocumentWriteTransform Maven / Gradle / Ivy

/*
 * Copyright 2012-2015 MarkLogic Corporation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.marklogic.client.example.cookbook;

import java.io.File;
import java.io.IOException;
import java.io.InputStream;

import com.marklogic.client.DatabaseClient;
import com.marklogic.client.DatabaseClientFactory;
import com.marklogic.client.DatabaseClientFactory.Authentication;
import com.marklogic.client.FailedRequestException;
import com.marklogic.client.ForbiddenUserException;
import com.marklogic.client.ResourceNotFoundException;
import com.marklogic.client.ResourceNotResendableException;
import com.marklogic.client.admin.ExtensionMetadata;
import com.marklogic.client.admin.TransformExtensionsManager;
import com.marklogic.client.document.ServerTransform;
import com.marklogic.client.document.TextDocumentManager;
import com.marklogic.client.document.XMLDocumentManager;
import com.marklogic.client.example.cookbook.Util.ExampleProperties;
import com.marklogic.client.io.InputStreamHandle;
import com.marklogic.client.io.StringHandle;

/**
 * DocumentWriteTransform installs a server transform for converting HTML documents
 * to XHTML documents so HTML documents can be written to the database, indexed,
 * and easily modified.
 */
public class DocumentWriteTransform {
	static final private String TRANSFORM_NAME = "html2xhtml";

	public static void main(String[] args)
	throws IOException, ResourceNotFoundException, ForbiddenUserException, FailedRequestException, ResourceNotResendableException {
		run(Util.loadProperties());
	}

	// install the transform and then write a transformed document 
	public static void run(ExampleProperties props)
	throws IOException, ResourceNotFoundException, ForbiddenUserException, FailedRequestException, ResourceNotResendableException {
		System.out.println("example: "+DocumentWriteTransform.class.getName());

		installTransform(props.host, props.port,
				props.adminUser, props.adminPassword, props.authType);

		writeDocument(props.host, props.port,
				props.writerUser, props.writerPassword, props.authType);

		tearDownExample(props.host, props.port,
				props.adminUser, props.adminPassword, props.authType);
	}

	public static void installTransform(String host, int port, String user, String password, Authentication authType)
	throws IOException, ResourceNotFoundException, ResourceNotResendableException, ForbiddenUserException, FailedRequestException {
		// create the client
		DatabaseClient client = DatabaseClientFactory.newClient(host, port, user, password, authType);

		// create a manager for transform extensions
		TransformExtensionsManager transMgr = client.newServerConfigManager().newTransformExtensionsManager();

		// specify metadata about the transform extension
		ExtensionMetadata metadata = new ExtensionMetadata();
		metadata.setTitle("HTML-TO-XHTML XQuery Transform");
		metadata.setDescription("This plugin transforms an HTML document to XHTML");
		metadata.setProvider("MarkLogic");
		metadata.setVersion("0.1");

		// acquire the transform source code
		InputStream transStream = Util.openStream(
				"scripts"+File.separator+TRANSFORM_NAME+".xqy");
		if (transStream == null)
			throw new IOException("Could not read example transform");

		// create a handle on the transform source code
		InputStreamHandle handle = new InputStreamHandle();
		handle.set(transStream);

		// write the transform extension to the database
		transMgr.writeXQueryTransform(TRANSFORM_NAME, handle, metadata);

		System.out.println("Installed the "+TRANSFORM_NAME+" transform");

		// release the client
		client.release();
	}

	public static void writeDocument(String host, int port, String user, String password, Authentication authType)
	throws IOException, ResourceNotFoundException, ForbiddenUserException, FailedRequestException {
		String filename = "sentiment.html";

		// create the client
		DatabaseClient client = DatabaseClientFactory.newClient(host, port, user, password, authType);

		// acquire the content
		InputStream docStream = Util.openStream("data"+File.separator+filename);
		if (docStream == null)
			throw new IOException("Could not read document example");

		// create a manager for writing text documents
		TextDocumentManager writeMgr = client.newTextDocumentManager();

		// create an identifier for the document
		String docId = "/example/"+filename;

		// create a handle on the content
		InputStreamHandle writeHandle = new InputStreamHandle();
		writeHandle.set(docStream);

		// specify the mime type for the content
		writeHandle.setMimetype("text/html");

		// specify the transform and its parameters
		ServerTransform transform = new ServerTransform(TRANSFORM_NAME);
		transform.put("drop-font-tags",              "yes");
		transform.put("drop-proprietary-attributes", "yes");
		transform.put("enclose-block-text",          "yes");
		transform.put("enclose-text",                "yes");
		transform.put("logical-emphasis",            "yes");

		// write the HTML content as XHTML by transforming in the database
		writeMgr.write(docId, writeHandle, transform);

		System.out.println("Wrote "+docId+" with transform");

		// read back the transformed XHTML document
		XMLDocumentManager readMgr = client.newXMLDocumentManager();

		StringHandle readHandle = new StringHandle();
		readMgr.read(docId, readHandle);

		System.out.println(readHandle.get());

		// release the client
		client.release();
	}

	// clean up by deleting the written document and the example transform
	public static void tearDownExample(
			String host, int port, String user, String password, Authentication authType)
	throws ResourceNotFoundException, ForbiddenUserException, FailedRequestException {
		DatabaseClient client = DatabaseClientFactory.newClient(host, port, user, password, authType);

		TextDocumentManager docMgr = client.newTextDocumentManager();

		docMgr.delete("/example/sentiment.html");

		TransformExtensionsManager transMgr =
			client.newServerConfigManager().newTransformExtensionsManager();

		transMgr.deleteTransform(TRANSFORM_NAME);

		client.release();
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy