org.apache.pdfbox.examples.pdmodel.ExtractTTFFonts Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of pdfbox-examples Show documentation
Show all versions of pdfbox-examples Show documentation
The Apache PDFBox library is an open-source Java tool for working with PDF documents.
This artefact contains examples of how the library can be used.
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.pdfbox.examples.pdmodel;
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import org.apache.pdfbox.cos.COSName;
import org.apache.pdfbox.io.IOUtils;
import org.apache.pdfbox.pdmodel.PDDocument;
import org.apache.pdfbox.pdmodel.PDPage;
import org.apache.pdfbox.pdmodel.PDResources;
import org.apache.pdfbox.pdmodel.common.PDStream;
import org.apache.pdfbox.pdmodel.font.PDCIDFont;
import org.apache.pdfbox.pdmodel.font.PDCIDFontType2;
import org.apache.pdfbox.pdmodel.font.PDFont;
import org.apache.pdfbox.pdmodel.font.PDFontDescriptor;
import org.apache.pdfbox.pdmodel.font.PDTrueTypeFont;
import org.apache.pdfbox.pdmodel.font.PDType0Font;
import org.apache.pdfbox.pdmodel.graphics.PDXObject;
import org.apache.pdfbox.pdmodel.graphics.form.PDFormXObject;
/**
* This will extract all TrueType fonts of a PDF document.
*
*/
public final class ExtractTTFFonts
{
    private static final String PASSWORD = "-password";
    private static final String PREFIX = "-prefix";
    private static final String ADDKEY = "-addkey";

    /**
     * Longest valid command line:
     * "-password &lt;pw&gt; -prefix &lt;prefix&gt; -addkey &lt;file&gt;" = 6 arguments.
     */
    private static final int MAX_ARGS = 6;

    /** Number of trailing characters removed from the PDF file name to derive the default prefix. */
    private static final int EXTENSION_LENGTH = 4;

    /** Running counter used to build unique output file names. */
    private int fontCounter = 1;

    private ExtractTTFFonts()
    {
    }

    /**
     * This is the entry point for the application.
     *
     * @param args The command-line arguments.
     *
     * @throws IOException If there is an error decrypting the document.
     */
    public static void main(String[] args) throws IOException
    {
        ExtractTTFFonts extractor = new ExtractTTFFonts();
        extractor.extractFonts(args);
    }

    /**
     * Parses the command line, loads the document and processes the resources of every page.
     *
     * @param args The command-line arguments.
     *
     * @throws IOException If the document cannot be loaded or a font cannot be written.
     */
    private void extractFonts(String[] args) throws IOException
    {
        if (args.length < 1 || args.length > MAX_ARGS)
        {
            usage();
            return;
        }

        String pdfFile = null;
        String password = "";
        String prefix = null;
        boolean addKey = false;
        for (int i = 0; i < args.length; i++)
        {
            if (args[i].equals(PASSWORD))
            {
                i++;
                if (i >= args.length)
                {
                    // option given without its value; do not rely on usage() never returning
                    usage();
                    return;
                }
                password = args[i];
            }
            else if (args[i].equals(PREFIX))
            {
                i++;
                if (i >= args.length)
                {
                    usage();
                    return;
                }
                prefix = args[i];
            }
            else if (args[i].equals(ADDKEY))
            {
                addKey = true;
            }
            else if (pdfFile == null)
            {
                // the first non-option argument is the PDF file, later ones are ignored
                pdfFile = args[i];
            }
        }

        if (pdfFile == null)
        {
            usage();
            return;
        }

        if (prefix == null)
        {
            // Default prefix: the file name without its last four characters (e.g. ".pdf").
            // Names too short to be shortened are used as they are, so that the prefix is
            // never null (which would end up as the literal text "null" in the file names).
            prefix = pdfFile.length() > EXTENSION_LENGTH
                    ? pdfFile.substring(0, pdfFile.length() - EXTENSION_LENGTH)
                    : pdfFile;
        }

        PDDocument document = null;
        try
        {
            document = PDDocument.load(new File(pdfFile), password);
            for (PDPage page : document.getPages())
            {
                // extract all fonts which are part of the page resources
                processResources(page.getResources(), prefix, addKey);
            }
        }
        finally
        {
            if (document != null)
            {
                document.close();
            }
        }
    }

    /**
     * Writes the TrueType fonts found in the given resources, then recurses into the resources
     * of every form XObject they contain.
     *
     * @param resources The resources to inspect, may be null.
     * @param prefix The prefix of the output file names.
     * @param addKey Whether the resource key of the font is appended to the prefix.
     *
     * @throws IOException If a font cannot be read or written.
     */
    private void processResources(PDResources resources, String prefix, boolean addKey) throws IOException
    {
        if (resources == null)
        {
            return;
        }

        for (COSName key : resources.getFontNames())
        {
            PDFont font = resources.getFont(key);
            if (font instanceof PDTrueTypeFont)
            {
                writeFont(font.getFontDescriptor(), buildFontFileName(prefix, key, addKey));
            }
            else if (font instanceof PDType0Font)
            {
                // for composite fonts the descriptor is taken from the descendant font
                PDCIDFont descendantFont = ((PDType0Font) font).getDescendantFont();
                if (descendantFont instanceof PDCIDFontType2)
                {
                    writeFont(descendantFont.getFontDescriptor(), buildFontFileName(prefix, key, addKey));
                }
            }
        }

        for (COSName name : resources.getXObjectNames())
        {
            PDXObject xobject = resources.getXObject(name);
            if (xobject instanceof PDFormXObject)
            {
                processResources(((PDFormXObject) xobject).getResources(), prefix, addKey);
            }
        }
    }

    /**
     * Builds the unique output file name (without extension) for a font.
     *
     * @param prefix The prefix of the output file name.
     * @param key The resource key of the font.
     * @param addKey Whether the key is appended to the prefix.
     *
     * @return A file name, without extension, for which no ".ttf" file exists yet.
     */
    private String buildFontFileName(String prefix, COSName key, boolean addKey)
    {
        String base = addKey ? prefix + "_" + key : prefix;
        return getUniqueFileName(base, "ttf");
    }

    /**
     * Copies the FontFile2 stream of the given font descriptor to the file "name.ttf".
     * Nothing is written if the descriptor is null or has no FontFile2 stream.
     *
     * @param fd The font descriptor, may be null.
     * @param name The output file name without extension.
     *
     * @throws IOException If the font stream cannot be read or the file cannot be written.
     */
    private void writeFont(PDFontDescriptor fd, String name) throws IOException
    {
        if (fd == null)
        {
            return;
        }
        PDStream ff2Stream = fd.getFontFile2();
        if (ff2Stream == null)
        {
            return;
        }

        System.out.println("Writing font:" + name);
        InputStream is = null;
        FileOutputStream fos = null;
        try
        {
            // open the source first so that a failure here does not leave an empty file behind
            is = ff2Stream.createInputStream();
            fos = new FileOutputStream(new File(name + ".ttf"));
            IOUtils.copy(is, fos);
        }
        finally
        {
            // close both streams, even if closing the first one fails
            try
            {
                if (fos != null)
                {
                    fos.close();
                }
            }
            finally
            {
                if (is != null)
                {
                    is.close();
                }
            }
        }
    }

    /**
     * Returns "prefix-N" for the first counter value N for which the file "prefix-N.suffix"
     * does not exist. The counter is shared by all calls on this instance and always advances.
     *
     * @param prefix The prefix of the file name.
     * @param suffix The file extension, without the dot.
     *
     * @return The unique file name without extension.
     */
    private String getUniqueFileName(String prefix, String suffix)
    {
        String uniqueName = null;
        File f = null;
        while (f == null || f.exists())
        {
            uniqueName = prefix + "-" + fontCounter;
            f = new File(uniqueName + "." + suffix);
            fontCounter++;
        }
        return uniqueName;
    }

    /**
     * This will print the usage requirements and exit.
     */
    private static void usage()
    {
        System.err.println("Usage: java " + ExtractTTFFonts.class.getName() + " [OPTIONS] <PDF file>\n"
                + "  -password <password>      Password to decrypt document\n"
                + "  -prefix <font-prefix>     Font prefix(default to pdf name)\n"
                + "  -addkey                   add the internal font key to the file name\n"
                + "  <PDF file>                The PDF document to use\n");
        System.exit(1);
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy