// com.aowagie.text.xml.SAXiTextHandler Maven / Gradle / Ivy
/*
* $Id: SAXiTextHandler.java 3427 2008-05-24 18:32:31Z xlv $
*
* Copyright 2001, 2002 by Bruno Lowagie.
*
* The contents of this file are subject to the Mozilla Public License Version 1.1
* (the "License"); you may not use this file except in compliance with the License.
* You may obtain a copy of the License at http://www.mozilla.org/MPL/
*
* Software distributed under the License is distributed on an "AS IS" basis,
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
* for the specific language governing rights and limitations under the License.
*
* The Original Code is 'iText, a free JAVA-PDF library'.
*
* The Initial Developer of the Original Code is Bruno Lowagie. Portions created by
* the Initial Developer are Copyright (C) 1999, 2000, 2001, 2002 by Bruno Lowagie.
* All Rights Reserved.
* Co-Developer of the code is Paulo Soares. Portions created by the Co-Developer
* are Copyright (C) 2000, 2001, 2002 by Paulo Soares. All Rights Reserved.
*
* Contributor(s): all the names of the contributors are added in the source code
* where applicable.
*
* Alternatively, the contents of this file may be used under the terms of the
* LGPL license (the "GNU LIBRARY GENERAL PUBLIC LICENSE"), in which case the
* provisions of LGPL are applicable instead of those above. If you wish to
* allow use of your version of this file only under the terms of the LGPL
* License and not to allow others to use your version of this file under
* the MPL, indicate your decision by deleting the provisions above and
* replace them with the notice and other provisions required by the LGPL.
* If you do not delete the provisions above, a recipient may use your version
* of this file under either the MPL or the GNU LIBRARY GENERAL PUBLIC LICENSE.
*
* This library is free software; you can redistribute it and/or modify it
* under the terms of the MPL as stated above or under the terms of the GNU
* Library General Public License as published by the Free Software Foundation;
* either version 2 of the License, or any later version.
*
* This library is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU Library general Public License for more
* details.
*
* If you didn't download this code from the following link, you should check if
* you aren't using an obsolete version:
* http://www.lowagie.com/iText/
*/
package com.aowagie.text.xml;
import java.lang.reflect.Field;
import java.util.ArrayList;
import java.util.Collections;
import java.util.EmptyStackException;
import java.util.HashMap;
import java.util.Iterator;
import java.util.Properties;
import java.util.Stack;
import org.xml.sax.Attributes;
import org.xml.sax.helpers.DefaultHandler;
import com.aowagie.text.Anchor;
import com.aowagie.text.Annotation;
import com.aowagie.text.BadElementException;
import com.aowagie.text.Cell;
import com.aowagie.text.Chapter;
import com.aowagie.text.Chunk;
import com.aowagie.text.DocListener;
import com.aowagie.text.DocumentException;
import com.aowagie.text.Element;
import com.aowagie.text.ElementTags;
import com.aowagie.text.ExceptionConverter;
import com.aowagie.text.Font;
import com.aowagie.text.Image;
import com.aowagie.text.List;
import com.aowagie.text.ListItem;
import com.aowagie.text.Meta;
import com.aowagie.text.PageSize;
import com.aowagie.text.Paragraph;
import com.aowagie.text.Rectangle;
import com.aowagie.text.Section;
import com.aowagie.text.Table;
import com.aowagie.text.TextElementArray;
import com.aowagie.text.factories.ElementFactory;
import com.aowagie.text.html.HtmlTagMap;
import com.aowagie.text.pdf.BaseFont;
import com.aowagie.text.pdf.draw.LineSeparator;
import com.aowagie.text.xml.simpleparser.EntitiesToSymbol;
/**
* This class is a Handler that controls the iText XML to PDF conversion.
* Subclass it, if you want to change the way iText translates XML to PDF.
*/
class SAXiTextHandler extends DefaultHandler {
/** The listener that receives every element, meta entry and page setting produced by this handler. */
private final DocListener document;
/**
* Stack of elements that have been started but not yet closed; they are
* waiting to be added to their parent element or to the document.
*/
private final Stack stack;
/** The chunk that is currently collecting character data, or null when no text is pending. */
private Chunk currentChunk = null;
/**
* Set to true when a start tag equal to ElementTags.IGNORE is seen and reset
* by the matching end tag; while it is true, start tags, end tags and
* character data are skipped.
*/
private boolean ignore = false;
/**
* When true (the default) the handler calls document.open() on the root
* start tag and document.close() on the root end tag. Set it to false if
* you want to open and close the Document-object yourself.
*/
private boolean controlOpenClose = true;
/** Top page margin; 36 unless the root tag carries an ElementTags.TOP attribute. */
private float topMargin = 36;
/** Right page margin; 36 unless the root tag carries an ElementTags.RIGHT attribute. */
private float rightMargin = 36;
/** Left page margin; 36 unless the root tag carries an ElementTags.LEFT attribute. */
private float leftMargin = 36;
/** Bottom page margin; 36 unless the root tag carries an ElementTags.BOTTOM attribute. */
private float bottomMargin = 36;
/**
 * Creates a handler that reports everything it builds to the given listener.
 * The element stack starts out empty.
 *
 * @param document the listener that receives the generated content
 */
SAXiTextHandler(final DocListener document) {
    // The superclass constructor is invoked implicitly.
    this.stack = new Stack();
    this.document = document;
}
/**
* This hashmap contains all the custom keys and peers.
* In this class it is only assigned by the two-argument constructors and
* never read; presumably subclasses consult it - verify against them.
*/
protected HashMap myTags;
/**
* Creates a handler for the given listener and stores the given HTML tag
* map in myTags.
* NOTE(review): this constructor is private and nothing in the visible part
* of this class calls it - confirm whether it is still needed.
*
* @param document the listener that receives the generated content
* @param myTags the tag map to store
*/
private SAXiTextHandler(final DocListener document, final HtmlTagMap myTags) {
this(document);
this.myTags = myTags;
}
/**
* Creates a handler for the given listener and stores the given map of
* custom tags in myTags.
*
* @param document the listener that receives the generated content
* @param myTags the map of custom keys and peers to store
*/
SAXiTextHandler(final DocListener document, final HashMap myTags) {
this(document);
this.myTags = myTags;
}
/**
* Enables or disables the handler's control over opening and closing the
* document.
*
* If the flag is true (the default), the handler calls document.open()
* when the start tag of the root element is encountered and
* document.close() when its end tag is met. If the flag is false, the
* caller has to open and close the document.
*
* @param controlOpenClose
* set this to false if you plan to open/close the Document
* yourself
*/
public void setControlOpenClose(final boolean controlOpenClose) {
this.controlOpenClose = controlOpenClose;
}
/**
 * SAX callback for a start tag. The attributes are copied into a
 * {@link Properties} object keyed by their qualified names and the tag is
 * then passed on to {@link #handleStartingTags(String, Properties)}.
 *
 * @param uri
 *            the Uniform Resource Identifier (not used)
 * @param lname
 *            the local name (not used)
 * @param name
 *            the name of the tag that is encountered
 * @param attrs
 *            the list of attributes; may be null
 */
@Override
public void startElement(final String uri, final String lname, final String name,
        final Attributes attrs) {
    final Properties collected = new Properties();
    final int count = (attrs == null) ? 0 : attrs.getLength();
    for (int index = 0; index < count; index++) {
        collected.setProperty(attrs.getQName(index), attrs.getValue(index));
    }
    handleStartingTags(name, collected);
}
/**
 * This method deals with the starting tags.
 * <p>
 * While the ignore flag is set (or when the tag itself is the ignore tag)
 * nothing is done. Otherwise any text collected so far is first moved to
 * the element on top of the stack, and the tag is then dispatched by name:
 * container tags push a new element on the stack, content-less tags
 * (image, annotation, newline, newpage, horizontal rule) are added to the
 * element on top of the stack or, if the stack is empty, to the document,
 * and the root tag configures and optionally opens the document.
 * <p>
 * An entity tag produces a symbol chunk that uses the font of the text that
 * directly preceded it, or a default font when there was no such text.
 *
 * @param name
 *            the name of the tag
 * @param attributes
 *            the list of attributes
 * @throws ExceptionConverter
 *             if an element cannot be created or added
 */
void handleStartingTags(final String name, final Properties attributes) {
    if (this.ignore || ElementTags.IGNORE.equals(name)) {
        this.ignore = true;
        return;
    }
    // maybe there is some meaningful data that wasn't between tags;
    // its font is remembered because an entity tag wants to reuse it
    final Font pendingFont = flushPendingChunk();
    // chunks
    if (ElementTags.CHUNK.equals(name)) {
        this.currentChunk = ElementFactory.getChunk(attributes);
        if (this.bf != null) {
            this.currentChunk.setFont(new Font(this.bf));
        }
        return;
    }
    // symbols
    if (ElementTags.ENTITY.equals(name)) {
        // The pending chunk has already been flushed (currentChunk is null
        // here), so the font must come from the value captured above.
        final Font symbolFont = (pendingFont != null) ? pendingFont : new Font();
        this.currentChunk = EntitiesToSymbol.get(attributes.getProperty(ElementTags.ID),
                symbolFont);
        return;
    }
    // phrases
    if (ElementTags.PHRASE.equals(name)) {
        this.stack.push(ElementFactory.getPhrase(attributes));
        return;
    }
    // anchors
    if (ElementTags.ANCHOR.equals(name)) {
        this.stack.push(ElementFactory.getAnchor(attributes));
        return;
    }
    // paragraphs and titles
    if (ElementTags.PARAGRAPH.equals(name) || ElementTags.TITLE.equals(name)) {
        this.stack.push(ElementFactory.getParagraph(attributes));
        return;
    }
    // lists
    if (ElementTags.LIST.equals(name)) {
        this.stack.push(ElementFactory.getList(attributes));
        return;
    }
    // listitems
    if (ElementTags.LISTITEM.equals(name)) {
        this.stack.push(ElementFactory.getListItem(attributes));
        return;
    }
    // cells
    if (ElementTags.CELL.equals(name)) {
        this.stack.push(ElementFactory.getCell(attributes));
        return;
    }
    // tables
    if (ElementTags.TABLE.equals(name)) {
        final Table table = ElementFactory.getTable(attributes);
        final float widths[] = table.getProportionalWidths();
        // columns without a width get an equal share of 100
        for (int i = 0; i < widths.length; i++) {
            if (widths[i] == 0) {
                widths[i] = 100.0f / widths.length;
            }
        }
        try {
            table.setWidths(widths);
        } catch (final BadElementException bee) {
            // this shouldn't happen
            throw new ExceptionConverter(bee);
        }
        this.stack.push(table);
        return;
    }
    // sections
    if (ElementTags.SECTION.equals(name)) {
        final Element previous = (Element) this.stack.pop();
        Section section;
        try {
            section = ElementFactory.getSection((Section) previous, attributes);
        } catch (final ClassCastException cce) {
            throw new ExceptionConverter(cce);
        }
        // the parent goes back first so the new section ends up on top
        this.stack.push(previous);
        this.stack.push(section);
        return;
    }
    // chapters
    if (ElementTags.CHAPTER.equals(name)) {
        this.stack.push(ElementFactory.getChapter(attributes));
        return;
    }
    // images
    if (ElementTags.IMAGE.equals(name)) {
        try {
            final Image img = ElementFactory.getImage(attributes);
            try {
                addImage(img);
            } catch (final EmptyStackException ese) {
                // if there is no suitable element on the stack, the Image
                // is added to the document
                this.document.add(img);
            }
        } catch (final Exception e) {
            // single wrap: a DocumentException is no longer converted twice
            throw new ExceptionConverter(e);
        }
        return;
    }
    // annotations
    if (ElementTags.ANNOTATION.equals(name)) {
        final Annotation annotation = ElementFactory.getAnnotation(attributes);
        TextElementArray current;
        try {
            try {
                current = (TextElementArray) this.stack.pop();
                try {
                    current.add(annotation);
                } catch (final Exception e) {
                    // the element on the stack refused it: use the document
                    this.document.add(annotation);
                }
                this.stack.push(current);
            } catch (final EmptyStackException ese) {
                this.document.add(annotation);
            }
            return;
        } catch (final DocumentException de) {
            throw new ExceptionConverter(de);
        }
    }
    // newlines
    if (isNewline(name)) {
        // currentChunk is always null at this point (it was flushed above),
        // so on an empty stack the newline goes straight to the document
        addToStackTopOrDocument(Chunk.NEWLINE);
        return;
    }
    // newpage
    if (isNewpage(name)) {
        TextElementArray current;
        try {
            current = (TextElementArray) this.stack.pop();
            final Chunk newPage = new Chunk("");
            newPage.setNewPage();
            if (this.bf != null) {
                newPage.setFont(new Font(this.bf));
            }
            current.add(newPage);
            this.stack.push(current);
        } catch (final EmptyStackException ese) {
            this.document.newPage();
        }
        return;
    }
    // horizontal rules
    if (ElementTags.HORIZONTALRULE.equals(name)) {
        addToStackTopOrDocument(
                new LineSeparator(1.0f, 100.0f, null, Element.ALIGN_CENTER, 0));
        return;
    }
    // documentroot
    if (isDocumentRoot(name)) {
        startDocumentRoot(attributes);
    }
}

/**
 * Moves the pending chunk, if any, to the element on top of the stack. If
 * the stack is empty a new empty paragraph (using the base font when one is
 * set) is created to hold it and pushed on the stack.
 *
 * @return the font of the chunk that was flushed, or null if no chunk was
 *         pending
 */
private Font flushPendingChunk() {
    if (this.currentChunk == null) {
        return null;
    }
    final Font flushedFont = this.currentChunk.getFont();
    TextElementArray current;
    try {
        current = (TextElementArray) this.stack.pop();
    } catch (final EmptyStackException ese) {
        current = new Paragraph("", (this.bf == null) ? new Font() : new Font(this.bf));
    }
    current.add(this.currentChunk);
    this.stack.push(current);
    this.currentChunk = null;
    return flushedFont;
}

/**
 * Adds an element to the element on top of the stack or, when the stack is
 * empty, directly to the document.
 *
 * @param element
 *            the element to add
 * @throws ExceptionConverter
 *             if the document rejects the element
 */
private void addToStackTopOrDocument(final Element element) {
    try {
        final TextElementArray current = (TextElementArray) this.stack.pop();
        current.add(element);
        this.stack.push(current);
    } catch (final EmptyStackException ese) {
        try {
            this.document.add(element);
        } catch (final DocumentException de) {
            throw new ExceptionConverter(de);
        }
    }
}

/**
 * Applies the attributes of the root tag: margins, page size and
 * orientation. Every attribute other than page size and orientation
 * (margins included) is also added to the document as a Meta entry.
 * Finally the margins are set and, if this handler controls open/close,
 * the document is opened.
 *
 * @param attributes
 *            the attributes of the root tag
 * @throws ExceptionConverter
 *             if a margin is not a number, the page size cannot be
 *             resolved, or a meta entry cannot be added
 */
private void startDocumentRoot(final Properties attributes) {
    // pagesize and orientation specific code suggested by Samuel Gabriel
    // Updated by Ricardo Coutinho. Only use if set in html!
    Rectangle pageSize = null;
    boolean landscape = false;
    for (final Object element : attributes.keySet()) {
        final String key = (String) element;
        final String value = attributes.getProperty(key);
        try {
            // margin specific code suggested by Reza Nasiri
            if (ElementTags.LEFT.equalsIgnoreCase(key)) {
                this.leftMargin = Float.parseFloat(value + "f");
            }
            if (ElementTags.RIGHT.equalsIgnoreCase(key)) {
                this.rightMargin = Float.parseFloat(value + "f");
            }
            if (ElementTags.TOP.equalsIgnoreCase(key)) {
                this.topMargin = Float.parseFloat(value + "f");
            }
            if (ElementTags.BOTTOM.equalsIgnoreCase(key)) {
                this.bottomMargin = Float.parseFloat(value + "f");
            }
        } catch (final NumberFormatException nfe) {
            throw new ExceptionConverter(nfe);
        }
        if (ElementTags.PAGE_SIZE.equals(key)) {
            try {
                // the value names a public static field of PageSize
                final Field pageSizeField = PageSize.class.getField(value);
                pageSize = (Rectangle) pageSizeField.get(null);
            } catch (final Exception ex) {
                throw new ExceptionConverter(ex);
            }
        } else if (ElementTags.ORIENTATION.equals(key)) {
            if ("landscape".equals(value)) {
                landscape = true;
            }
        } else {
            try {
                this.document.add(new Meta(key, value));
            } catch (final DocumentException de) {
                throw new ExceptionConverter(de);
            }
        }
    }
    if (pageSize != null) {
        if (landscape) {
            pageSize = pageSize.rotate();
        }
        this.document.setPageSize(pageSize);
    }
    this.document.setMargins(this.leftMargin, this.rightMargin, this.topMargin,
            this.bottomMargin);
    if (this.controlOpenClose) {
        this.document.open();
    }
}
/**
 * Adds an image to the nearest Chapter, Section or Cell on the stack,
 * searching from the top of the stack downwards.
 * <p>
 * For every Anchor passed on the way down, the image's annotation is set
 * to a link to that anchor's reference (the deepest anchor wins). This
 * also happens when no container is found in the end.
 * <p>
 * The stack is only inspected, never modified, so the open elements are
 * still in place when the search fails and the caller falls back to adding
 * the image to the document.
 *
 * @param img
 *            the image to add
 * @throws EmptyStackException
 *             if the stack holds no Chapter, Section or Cell
 */
private void addImage(final Image img) throws EmptyStackException {
    for (int depth = this.stack.size() - 1; depth >= 0; depth--) {
        final Object candidate = this.stack.get(depth);
        if (candidate instanceof Chapter
                || candidate instanceof Section
                || candidate instanceof Cell) {
            // the Image can be added directly to these containers
            ((TextElementArray) candidate).add(img);
            return;
        }
        if (candidate instanceof Anchor) {
            img.setAnnotation(new Annotation(0, 0, 0,
                    0, ((Anchor) candidate).getReference()));
        }
    }
    // no suitable container: signal it the same way an exhausted stack would
    throw new EmptyStackException();
}
/**
 * SAX callback for ignorable white space. The white space is not ignored:
 * it is processed exactly like ordinary character data.
 *
 * @param ch
 *            an array of characters
 * @param start
 *            the start position in the array
 * @param length
 *            the number of characters to read from the array
 */
@Override
public void ignorableWhitespace(final char[] ch, final int start, final int length) {
    this.characters(ch, start, length);
}
/**
 * SAX callback for character data. Nothing happens while the ignore flag
 * is set, or when the text consists only of white space and contains no
 * space character.
 * <p>
 * Otherwise the text is normalized and appended to the current chunk; a
 * new chunk (using the base font when one is set) is created if there is
 * none. Normalization rules:
 * <ul>
 * <li>carriage returns and tabs are dropped;</li>
 * <li>a newline becomes a single space, unless it is the very first
 * character of this call, in which case it is dropped;</li>
 * <li>spaces that follow such a converted newline are dropped until the
 * next character that is not a space, tab, carriage return or newline.</li>
 * </ul>
 *
 * @param ch
 *            an array of characters
 * @param start
 *            the start position in the array
 * @param length
 *            the number of characters to read from the array
 */
@Override
public void characters(final char[] ch, final int start, final int length) {
    if (this.ignore) {
        return;
    }
    final String raw = new String(ch, start, length);
    final boolean whitespaceOnly = raw.trim().length() == 0;
    if (whitespaceOnly && raw.indexOf(' ') < 0) {
        return;
    }
    final StringBuilder text = new StringBuilder();
    boolean afterNewline = false;
    for (int pos = 0; pos < raw.length(); pos++) {
        final char c = raw.charAt(pos);
        if (c == ' ') {
            if (!afterNewline) {
                text.append(c);
            }
        } else if (c == '\n') {
            if (pos > 0) {
                afterNewline = true;
                text.append(' ');
            }
        } else if (c == '\r' || c == '\t') {
            // dropped; the newline state is deliberately left as it is
            continue;
        } else {
            afterNewline = false;
            text.append(c);
        }
    }
    final String normalized = text.toString();
    if (this.currentChunk != null) {
        this.currentChunk.append(normalized);
        return;
    }
    if (this.bf != null) {
        this.currentChunk = new Chunk(normalized, new Font(this.bf));
    } else {
        this.currentChunk = new Chunk(normalized);
    }
}
/**
* Optional base font. When it is not null, the chunks and paragraphs this
* handler creates itself are given a Font built from it.
*/
private BaseFont bf = null;
/**
* Sets the font that has to be used.
* @param bf Base font, or null to fall back to the default fonts
*/
public void setBaseFont(final BaseFont bf) {
this.bf = bf;
}
/**
 * SAX callback for an end tag; the tag name is passed on to
 * {@link #handleEndingTags(String)}.
 *
 * @param uri
 *            the Uniform Resource Identifier (not used)
 * @param lname
 *            the local name (not used)
 * @param name
 *            the name of the tag that ends
 */
@Override
public void endElement(final String uri, final String lname, final String name) {
    this.handleEndingTags(name);
}
/**
* This method deals with the ending tags.
*
* The end tag of the ignore element clears the ignore flag; while that flag
* is set every other end tag is skipped. For the remaining tags the element
* on top of the stack is completed and handed to its parent (the next
* element on the stack) or, where the code provides for it, to the document
* when the stack holds no parent. A DocumentException raised while adding
* is rethrown as an ExceptionConverter.
*
* @param name
* the name of the tag
*/
void handleEndingTags(final String name) {
if (ElementTags.IGNORE.equals(name)) {
this.ignore = false;
return;
}
if (this.ignore) {
return;
}
// tags that don't have any content
if (isNewpage(name) || ElementTags.ANNOTATION.equals(name) || ElementTags.IMAGE.equals(name)
|| isNewline(name)) {
return;
}
try {
// titles of sections and chapters
if (ElementTags.TITLE.equals(name)) {
final Paragraph current = (Paragraph) this.stack.pop();
if (this.currentChunk != null) {
current.add(this.currentChunk);
this.currentChunk = null;
}
// the element below the title paragraph is the section that owns it
final Section previous = (Section) this.stack.pop();
previous.setTitle(current);
this.stack.push(previous);
return;
}
// all other endtags: move pending text to the element on top of the
// stack, or to a new paragraph if the stack is empty
if (this.currentChunk != null) {
TextElementArray current;
try {
current = (TextElementArray) this.stack.pop();
} catch (final EmptyStackException ese) {
current = new Paragraph();
}
current.add(this.currentChunk);
this.stack.push(current);
this.currentChunk = null;
}
// chunks: the text was already flushed above
if (ElementTags.CHUNK.equals(name)) {
return;
}
// phrases, anchors, lists, paragraphs: add to the parent, or to the
// document if there is no parent
if (ElementTags.PHRASE.equals(name) || ElementTags.ANCHOR.equals(name) || ElementTags.LIST.equals(name)
|| ElementTags.PARAGRAPH.equals(name)) {
final Element current = (Element) this.stack.pop();
try {
final TextElementArray previous = (TextElementArray) this.stack.pop();
previous.add(current);
this.stack.push(previous);
} catch (final EmptyStackException ese) {
this.document.add(current);
}
return;
}
// listitems: the element below the item must be its list
// (no return here: execution falls through to the remaining checks)
if (ElementTags.LISTITEM.equals(name)) {
final ListItem listItem = (ListItem) this.stack.pop();
final List list = (List) this.stack.pop();
list.add(listItem);
this.stack.push(list);
}
// tables: add to the parent, or to the document if there is no parent
if (ElementTags.TABLE.equals(name)) {
final Table table = (Table) this.stack.pop();
try {
final TextElementArray previous = (TextElementArray) this.stack.pop();
previous.add(table);
this.stack.push(previous);
} catch (final EmptyStackException ese) {
this.document.add(table);
}
return;
}
// rows
if (ElementTags.ROW.equals(name)) {
final ArrayList cells = new ArrayList();
int columns = 0;
Table table;
Cell cell;
// pop the cells of this row (last cell first) until the first
// non-cell element is reached; that element is cast to the table
while (true) {
final Element element = (Element) this.stack.pop();
if (element.type() == Element.CELL) {
cell = (Cell) element;
columns += cell.getColspan();
cells.add(cell);
} else {
table = (Table) element;
break;
}
}
// widen the table if this row spans more columns than it has
if (table.getColumns() < columns) {
table.addColumns(columns - table.getColumns());
}
// restore document order of the cells
Collections.reverse(cells);
String width;
final float[] cellWidths = new float[columns];
final boolean[] cellNulls = new boolean[columns];
for (int i = 0; i < columns; i++) {
cellWidths[i] = 0;
cellNulls[i] = true;
}
// total: sum of the widths assigned in the loop below
float total = 0;
// j: index of the column in which the current cell starts
int j = 0;
for (final Iterator i = cells.iterator(); i.hasNext();) {
cell = (Cell) i.next();
width = cell.getWidthAsString();
if (cell.getWidth() == 0) {
if (cell.getColspan() == 1 && cellWidths[j] == 0) {
try {
// no width given: take an equal share of 100
cellWidths[j] = 100f / columns;
total += cellWidths[j];
} catch (final Exception e) {
// empty on purpose
}
} else if (cell.getColspan() == 1) {
cellNulls[j] = false;
}
} else if (cell.getColspan() == 1 && width.endsWith("%")) {
try {
// percentage width: strip the '%' and parse the number
cellWidths[j] = Float.parseFloat(
width.substring(0, width.length() - 1)
+ "f");
total += cellWidths[j];
} catch (final Exception e) {
// empty on purpose
}
}
j += cell.getColspan();
table.addCell(cell);
}
final float widths[] = table.getProportionalWidths();
// only recompute the table widths when the row spans every column
if (widths.length == columns) {
// left: sum of the table's current widths for columns still flagged in cellNulls
float left = 0.0f;
for (int i = 0; i < columns; i++) {
if (cellNulls[i] && widths[i] != 0) {
left += widths[i];
cellWidths[i] = widths[i];
}
}
if (100.0 >= total) {
// columns still without a width share what is left of 100,
// in proportion to their current table width
for (int i = 0; i < widths.length; i++) {
if (cellWidths[i] == 0 && widths[i] != 0) {
cellWidths[i] = widths[i] / left
* (100.0f - total);
}
}
}
table.setWidths(cellWidths);
}
// (no return here: execution falls through to the remaining checks)
this.stack.push(table);
}
// cells: stay on the stack until the end of their row
if (ElementTags.CELL.equals(name)) {
return;
}
// sections: simply removed from the stack
if (ElementTags.SECTION.equals(name)) {
this.stack.pop();
return;
}
// chapters: added to the document
if (ElementTags.CHAPTER.equals(name)) {
this.document.add((Element) this.stack.pop());
return;
}
// the documentroot: unwind whatever is still on the stack
if (isDocumentRoot(name)) {
try {
while (true) {
final Element element = (Element) this.stack.pop();
try {
final TextElementArray previous = (TextElementArray) this.stack
.pop();
previous.add(element);
this.stack.push(previous);
} catch (final EmptyStackException es) {
// element was the last one on the stack
this.document.add(element);
}
}
} catch (final EmptyStackException ese) {
// empty on purpose: the stack is exhausted, which ends the loop
}
if (this.controlOpenClose) {
this.document.close();
}
return;
}
} catch (final DocumentException de) {
throw new ExceptionConverter(de);
}
}
/**
* Checks if a certain tag corresponds with the newpage-tag
* (ElementTags.NEWPAGE).
*
* @param tag
* a presumed tagname
* @return true if the tag is the newpage-tag, false otherwise
*/
private boolean isNewpage(final String tag) {
return ElementTags.NEWPAGE.equals(tag);
}
/**
* Checks if a certain tag corresponds with the newline-tag
* (ElementTags.NEWLINE).
*
* @param tag
* a presumed tagname
* @return true if the tag is the newline-tag, false otherwise
*/
private boolean isNewline(final String tag) {
return ElementTags.NEWLINE.equals(tag);
}
/**
* Checks if a certain tag corresponds with the roottag.
*
* @param tag
* a presumed tagname
* @return true if tag equals ElementTags.ITEXT, false otherwise
*/
private boolean isDocumentRoot(final String tag) {
return ElementTags.ITEXT.equals(tag);
}
}