
org.fit.pdfdom.PDFDomTreeConfig Maven / Gradle / Ivy
Go to download
Pdf2Dom is a PDF parser that converts documents to an HTML DOM representation. The resulting DOM tree may then be serialized to an HTML file or processed further. The inline CSS definitions contained in the resulting document are used to make the HTML page as similar as possible to the PDF input. A command-line utility for converting PDF documents to HTML is included in the distribution package. Pdf2Dom may also be used as an independent Java library with a standard DOM interface for your DOM-based applications, or as an alternative parser for the CSSBox rendering engine in order to add PDF processing capability to CSSBox.
/*
* Copyright (c) Matthew Abboud 2016
*
* Pdf2Dom is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Pdf2Dom is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with CSSBox. If not, see <http://www.gnu.org/licenses/>.
*/
package org.fit.pdfdom;
import org.fit.pdfdom.resource.EmbedAsBase64Handler;
import org.fit.pdfdom.resource.HtmlResourceHandler;
import org.fit.pdfdom.resource.IgnoreResourceHandler;
import org.fit.pdfdom.resource.SaveResourceToDirHandler;
import java.io.File;
/**
 * Configuration object that carries two {@link HtmlResourceHandler} references:
 * one registered for images and one registered for fonts.
 *
 * <p>Instances cannot be constructed directly; obtain one through
 * {@link #createDefaultConfig()} and adjust it with the setters. The static
 * helpers {@link #embedAsBase64()}, {@link #saveToDirectory(File)} and
 * {@link #ignoreResource()} create the handler implementations shipped in
 * {@code org.fit.pdfdom.resource}.
 *
 * <p>NOTE(review): how the handlers are consumed is decided by code outside
 * this class; nothing here validates them, so {@code null} is stored as-is.
 */
public class PDFDomTreeConfig
{
    /** Handler registered for image resources; unset until a setter or the factory assigns it. */
    private HtmlResourceHandler imageHandler;

    /** Handler registered for font resources; unset until a setter or the factory assigns it. */
    private HtmlResourceHandler fontHandler;

    /** Hidden so that instances are only created via {@link #createDefaultConfig()}. */
    private PDFDomTreeConfig()
    {
    }

    /**
     * Creates a configuration whose font handler and image handler are each a
     * separate handler obtained from {@link #embedAsBase64()}.
     *
     * @return a newly created configuration with both handlers set
     */
    public static PDFDomTreeConfig createDefaultConfig()
    {
        final PDFDomTreeConfig defaults = new PDFDomTreeConfig();
        // Same order as before: the font handler is created first, then the image handler.
        defaults.fontHandler = embedAsBase64();
        defaults.imageHandler = embedAsBase64();
        return defaults;
    }

    /**
     * Creates a new {@link EmbedAsBase64Handler}.
     *
     * @return a fresh handler instance on every call
     */
    public static HtmlResourceHandler embedAsBase64()
    {
        final HtmlResourceHandler handler = new EmbedAsBase64Handler();
        return handler;
    }

    /**
     * Creates a new {@link SaveResourceToDirHandler} for the given directory.
     *
     * @param directory passed unchanged to the handler's constructor
     * @return a fresh handler instance on every call
     */
    public static HtmlResourceHandler saveToDirectory(File directory)
    {
        final HtmlResourceHandler handler = new SaveResourceToDirHandler(directory);
        return handler;
    }

    /**
     * Creates a new {@link IgnoreResourceHandler}.
     *
     * @return a fresh handler instance on every call
     */
    public static HtmlResourceHandler ignoreResource()
    {
        final HtmlResourceHandler handler = new IgnoreResourceHandler();
        return handler;
    }

    /**
     * @return the handler currently registered for images
     */
    public HtmlResourceHandler getImageHandler()
    {
        return this.imageHandler;
    }

    /**
     * Replaces the handler registered for images.
     *
     * @param imageHandler the handler to store; stored without any validation
     */
    public void setImageHandler(HtmlResourceHandler imageHandler)
    {
        this.imageHandler = imageHandler;
    }

    /**
     * @return the handler currently registered for fonts
     */
    public HtmlResourceHandler getFontHandler()
    {
        return this.fontHandler;
    }

    /**
     * Replaces the handler registered for fonts.
     *
     * @param fontHandler the handler to store; stored without any validation
     */
    public void setFontHandler(HtmlResourceHandler fontHandler)
    {
        this.fontHandler = fontHandler;
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy