All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.fit.pdfdom.resource.SaveResourceToDirHandler Maven / Gradle / Ivy

Go to download

Pdf2Dom is a PDF parser that converts the documents to a HTML DOM representation. The obtained DOM tree may be then serialized to a HTML file or further processed. The inline CSS definitions contained in the resulting document are used for making the HTML page as similar as possible to the PDF input. A command-line utility for converting the PDF documents to HTML is included in the distribution package. Pdf2Dom may be also used as an independent Java library with a standard DOM interface for your DOM-based applications or as an alternative parser for the CSSBox rendering engine in order to add the PDF processing capability to CSSBox.

There is a newer version: 2.0.3
Show newest version
/*
 *  Copyright (c) Matthew Abboud 2016
 *
 *  Pdf2Dom is free software: you can redistribute it and/or modify
 *  it under the terms of the GNU Lesser General Public License as published by
 *  the Free Software Foundation, either version 3 of the License, or
 *  (at your option) any later version.
 *
 *  Pdf2Dom is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 *  GNU Lesser General Public License for more details.
 *
 *  You should have received a copy of the GNU Lesser General Public License
 *  along with CSSBox. If not, see .
 */

package org.fit.pdfdom.resource;

import org.apache.commons.io.FileUtils;

import java.io.File;
import java.io.IOException;
import java.util.LinkedList;
import java.util.List;

public class SaveResourceToDirHandler implements HtmlResourceHandler
{
    public static final String DEFAULT_RESOURCE_DIR = "resources/";

    private final File directory;
    private List writtenFileNames = new LinkedList();

    public SaveResourceToDirHandler()
    {
        directory = null;
    }

    public SaveResourceToDirHandler(File directory)
    {
        this.directory = directory;
    }

    public String handleResource(HtmlResource resource) throws IOException
    {
        String dir = DEFAULT_RESOURCE_DIR;
        if (directory != null)
            dir = directory.getPath() + "/";

        String fileName = findNextUnusedFileName(resource.getName());
        String resourcePath = dir + fileName + "." + resource.getFileEnding();

        File file = new File(resourcePath);
        FileUtils.writeByteArrayToFile(file, resource.getData());

        writtenFileNames.add(fileName);

        return resourcePath;
    }

    private String findNextUnusedFileName(String fileName)
    {
        int i = 1;
        String usedName = fileName;
        while (writtenFileNames.contains(usedName)) {
            usedName = fileName + i;
            i++;
        }

        return usedName;
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy