com.caucho.xml.LooseHtml Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of resin Show documentation
Show all versions of resin Show documentation
Resin Java Application Server
/*
* Copyright (c) 1998-2018 Caucho Technology -- all rights reserved
*
* This file is part of Resin(R) Open Source
*
* Each copy or derived work must preserve the copyright notice and this
* notice unmodified.
*
* Resin Open Source is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* Resin Open Source is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE, or any warranty
* of NON-INFRINGEMENT. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License
* along with Resin Open Source; if not, write to the
* Free SoftwareFoundation, Inc.
* 59 Temple Place, Suite 330
* Boston, MA 02111-1307 USA
*
* @author Scott Ferguson
*/
package com.caucho.xml;
/**
* A forgiving HTML parser interface.
*
* The forgiving HTML parser is useful for extracting information from
* the web since many sites have not-quite-standard HTML.
*
*
To parse a file into a DOM Document use
*
* Document doc = new Html().parseDocument("foo.html");
*
*
* To parse a string into a DOM Document use
*
* String html = "<h1>small test</h1>";
* Document doc = new Html().parseDocumentString(html);
*
*
* To parse a file using the SAX API use
*
* Html html = new Html();
* html.setContentHandler(myContentHandler);
* html.parse("foo.html");
*
*/
public class LooseHtml extends XmlParser {
/**
* Create a new forgiving HTML parser
*/
public LooseHtml()
{
super(new HtmlPolicy(), null);
_policy.forgiving = true;
_forgiving = true;
_extraForgiving = true;
}
}