com.lowagie.text.html.SAXmyHtmlHandler Maven / Gradle / Ivy
The newest version!
/*
* $Id: SAXmyHtmlHandler.java 3373 2008-05-12 16:21:24Z xlv $
*
* Copyright 2001, 2002 by Bruno Lowagie.
*
* The contents of this file are subject to the Mozilla Public License Version 1.1
* (the "License"); you may not use this file except in compliance with the License.
* You may obtain a copy of the License at http://www.mozilla.org/MPL/
*
* Software distributed under the License is distributed on an "AS IS" basis,
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
* for the specific language governing rights and limitations under the License.
*
* The Original Code is 'iText, a free JAVA-PDF library'.
*
* The Initial Developer of the Original Code is Bruno Lowagie. Portions created by
* the Initial Developer are Copyright (C) 1999, 2000, 2001, 2002 by Bruno Lowagie.
* All Rights Reserved.
* Co-Developer of the code is Paulo Soares. Portions created by the Co-Developer
* are Copyright (C) 2000, 2001, 2002 by Paulo Soares. All Rights Reserved.
*
* Contributor(s): all the names of the contributors are added in the source code
* where applicable.
*
* Alternatively, the contents of this file may be used under the terms of the
* LGPL license (the "GNU LIBRARY GENERAL PUBLIC LICENSE"), in which case the
* provisions of LGPL are applicable instead of those above. If you wish to
* allow use of your version of this file only under the terms of the LGPL
* License and not to allow others to use your version of this file under
* the MPL, indicate your decision by deleting the provisions above and
* replace them with the notice and other provisions required by the LGPL.
* If you do not delete the provisions above, a recipient may use your version
* of this file under either the MPL or the GNU LIBRARY GENERAL PUBLIC LICENSE.
*
* This library is free software; you can redistribute it and/or modify it
* under the terms of the MPL as stated above or under the terms of the GNU
* Library General Public License as published by the Free Software Foundation;
* either version 2 of the License, or any later version.
*
* This library is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU Library general Public License for more
* details.
*
* If you didn't download this code from the following link, you should check if
* you aren't using an obsolete version:
* http://www.lowagie.com/iText/
*/
package com.lowagie.text.html;
import java.util.HashMap;
import java.util.Properties;
import org.xml.sax.Attributes;
import com.lowagie.text.DocListener;
import com.lowagie.text.DocumentException;
import com.lowagie.text.Element;
import com.lowagie.text.ElementTags;
import com.lowagie.text.ExceptionConverter;
import com.lowagie.text.pdf.BaseFont;
import com.lowagie.text.xml.SAXiTextHandler;
import com.lowagie.text.xml.XmlPeer;
/**
* The Tags
-class maps several XHTML-tags to iText-objects.
*/
public class SAXmyHtmlHandler extends SAXiTextHandler // SAXmyHandler
{
/** These are the properties of the body section. */
private Properties bodyAttributes = new Properties();
/** This is the status of the table border. */
private boolean tableBorder = false;
/**
* Constructs a new SAXiTextHandler that will translate all the events
* triggered by the parser to actions on the Document
-object.
*
* @param document
* this is the document on which events must be triggered
*/
public SAXmyHtmlHandler(DocListener document) {
super(document, new HtmlTagMap());
}
/**
* Constructs a new SAXiTextHandler that will translate all the events
* triggered by the parser to actions on the Document
-object.
*
* @param document
* this is the document on which events must be triggered
* @param bf
*/
public SAXmyHtmlHandler(DocListener document, BaseFont bf) {
super(document, new HtmlTagMap(), bf);
}
/**
* Constructs a new SAXiTextHandler that will translate all the events
* triggered by the parser to actions on the Document
-object.
*
* @param document
* this is the document on which events must be triggered
* @param htmlTags
* a tagmap translating HTML tags to iText tags
*/
public SAXmyHtmlHandler(DocListener document, HashMap htmlTags) {
super(document, htmlTags);
}
/**
* This method gets called when a start tag is encountered.
*
* @param uri
* the Uniform Resource Identifier
* @param lname
* the local name (without prefix), or the empty string if
* Namespace processing is not being performed.
* @param name
* the name of the tag that is encountered
* @param attrs
* the list of attributes
*/
public void startElement(String uri, String lname, String name,
Attributes attrs) {
// System.err.println("Start: " + name);
// super.handleStartingTags is replaced with handleStartingTags
// suggestion by Vu Ngoc Tan/Hop
name = name.toLowerCase();
if (HtmlTagMap.isHtml(name)) {
// we do nothing
return;
}
if (HtmlTagMap.isHead(name)) {
// we do nothing
return;
}
if (HtmlTagMap.isTitle(name)) {
// we do nothing
return;
}
if (HtmlTagMap.isMeta(name)) {
// we look if we can change the body attributes
String meta = null;
String content = null;
if (attrs != null) {
for (int i = 0; i < attrs.getLength(); i++) {
String attribute = attrs.getQName(i);
if (attribute.equalsIgnoreCase(HtmlTags.CONTENT))
content = attrs.getValue(i);
else if (attribute.equalsIgnoreCase(HtmlTags.NAME))
meta = attrs.getValue(i);
}
}
if (meta != null && content != null) {
bodyAttributes.put(meta, content);
}
return;
}
if (HtmlTagMap.isLink(name)) {
// we do nothing for the moment, in a later version we could extract
// the style sheet
return;
}
if (HtmlTagMap.isBody(name)) {
// maybe we could extract some info about the document: color,
// margins,...
// but that's for a later version...
XmlPeer peer = new XmlPeer(ElementTags.ITEXT, name);
peer.addAlias(ElementTags.TOP, HtmlTags.TOPMARGIN);
peer.addAlias(ElementTags.BOTTOM, HtmlTags.BOTTOMMARGIN);
peer.addAlias(ElementTags.RIGHT, HtmlTags.RIGHTMARGIN);
peer.addAlias(ElementTags.LEFT, HtmlTags.LEFTMARGIN);
bodyAttributes.putAll(peer.getAttributes(attrs));
handleStartingTags(peer.getTag(), bodyAttributes);
return;
}
if (myTags.containsKey(name)) {
XmlPeer peer = (XmlPeer) myTags.get(name);
if (ElementTags.TABLE.equals(peer.getTag()) || ElementTags.CELL.equals(peer.getTag())) {
Properties p = peer.getAttributes(attrs);
String value;
if (ElementTags.TABLE.equals(peer.getTag())
&& (value = p.getProperty(ElementTags.BORDERWIDTH)) != null) {
if (Float.parseFloat(value + "f") > 0) {
tableBorder = true;
}
}
if (tableBorder) {
p.put(ElementTags.LEFT, String.valueOf(true));
p.put(ElementTags.RIGHT, String.valueOf(true));
p.put(ElementTags.TOP, String.valueOf(true));
p.put(ElementTags.BOTTOM, String.valueOf(true));
}
handleStartingTags(peer.getTag(), p);
return;
}
handleStartingTags(peer.getTag(), peer.getAttributes(attrs));
return;
}
Properties attributes = new Properties();
if (attrs != null) {
for (int i = 0; i < attrs.getLength(); i++) {
String attribute = attrs.getQName(i).toLowerCase();
attributes.setProperty(attribute, attrs.getValue(i).toLowerCase());
}
}
handleStartingTags(name, attributes);
}
/**
* This method gets called when an end tag is encountered.
*
* @param uri
* the Uniform Resource Identifier
* @param lname
* the local name (without prefix), or the empty string if
* Namespace processing is not being performed.
* @param name
* the name of the tag that ends
*/
public void endElement(String uri, String lname, String name) {
// System.err.println("End: " + name);
name = name.toLowerCase();
if (ElementTags.PARAGRAPH.equals(name)) {
try {
document.add((Element) stack.pop());
return;
} catch (DocumentException e) {
throw new ExceptionConverter(e);
}
}
if (HtmlTagMap.isHead(name)) {
// we do nothing
return;
}
if (HtmlTagMap.isTitle(name)) {
if (currentChunk != null) {
bodyAttributes.put(ElementTags.TITLE, currentChunk.getContent());
}
return;
}
if (HtmlTagMap.isMeta(name)) {
// we do nothing
return;
}
if (HtmlTagMap.isLink(name)) {
// we do nothing
return;
}
if (HtmlTagMap.isBody(name)) {
// we do nothing
return;
}
if (myTags.containsKey(name)) {
XmlPeer peer = (XmlPeer) myTags.get(name);
if (ElementTags.TABLE.equals(peer.getTag())) {
tableBorder = false;
}
super.handleEndingTags(peer.getTag());
return;
}
// super.handleEndingTags is replaced with handleEndingTags
// suggestion by Ken Auer
handleEndingTags(name);
}
}