All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.attoparser.dom.IDOMMarkupParser Maven / Gradle / Ivy

There is a newer version: 2.0.7.RELEASE
Show newest version
/*
 * =============================================================================
 * 
 *   Copyright (c) 2012-2014, The ATTOPARSER team (http://www.attoparser.org)
 * 
 *   Licensed under the Apache License, Version 2.0 (the "License");
 *   you may not use this file except in compliance with the License.
 *   You may obtain a copy of the License at
 * 
 *       http://www.apache.org/licenses/LICENSE-2.0
 * 
 *   Unless required by applicable law or agreed to in writing, software
 *   distributed under the License is distributed on an "AS IS" BASIS,
 *   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *   See the License for the specific language governing permissions and
 *   limitations under the License.
 * 
 * =============================================================================
 */
package org.attoparser.dom;

import java.io.Reader;

import org.attoparser.ParseException;


/**
 * Contract shared by every DOM markup parser.
 *
 * <p>
 *   The default implementation is {@link org.attoparser.dom.DOMMarkupParser}.
 * </p>
 * <p>
 *   The DOM trees produced through this interface are composed of objects of
 *   the classes living in the {@code org.attoparser.dom} package.
 * </p>
 * <p>
 *   This parser interface is really a convenience artifact: it exists so that
 *   the {@link org.attoparser.dom.DOMBuilderMarkupHandler} DOM-conversion
 *   handler can be used more easily.
 * </p>
 * <p>
 *   Sample usage:
 * </p>
 * <pre>{@code
 *   // Obtain a java.io.Reader on the document to be parsed
 *   final Reader documentReader = ...;
 *
 *   // Create or obtain the parser instance (note this is not the 'simple' one!)
 *   final IDOMMarkupParser parser = new DOMMarkupParser(ParseConfiguration.htmlConfiguration());
 *
 *   // Parse it and return the Document Object Model
 *   final Document document = parser.parse("Some document", documentReader);
 * }</pre>
 * <p>
 *   Implementations of this interface should be thread-safe, so that a single
 *   parser instance can be reused across several parsing operations and by any
 *   number of concurrent threads.
 * </p>
 *
 * @author Daniel Fernández
 *
 * @since 2.0.0
 *
 */
public interface IDOMMarkupParser {


    /**
     * Parses a document supplied as a {@code String} and converts it into a
     * DOM tree made of classes from the {@code org.attoparser.dom} package.
     *
     * @param document the document to be parsed, as a {@code String}.
     * @return the {@link org.attoparser.dom.Document} object resulting from parsing.
     * @throws ParseException if the document cannot be parsed.
     */
    Document parse(String document)
            throws ParseException;


    /**
     * Parses a document supplied as a {@code char[]} and converts it into a
     * DOM tree made of classes from the {@code org.attoparser.dom} package.
     *
     * @param document the document to be parsed, as a {@code char[]}.
     * @return the {@link org.attoparser.dom.Document} object resulting from parsing.
     * @throws ParseException if the document cannot be parsed.
     */
    Document parse(char[] document)
            throws ParseException;


    /**
     * Parses a document stored in a section of a {@code char[]} and converts
     * it into a DOM tree made of classes from the {@code org.attoparser.dom}
     * package.
     *
     * @param document the document to be parsed, as a {@code char[]}.
     * @param offset the offset to be applied on the {@code char[]} document to
     *               determine the start of the document contents.
     * @param len the length (in chars) of the document stored in the {@code char[]}.
     * @return the {@link org.attoparser.dom.Document} object resulting from parsing.
     * @throws ParseException if the document cannot be parsed.
     */
    Document parse(char[] document, int offset, int len)
            throws ParseException;


    /**
     * Parses a document read from a {@link Reader} and converts it into a
     * DOM tree made of classes from the {@code org.attoparser.dom} package.
     *
     * <p>
     *   Implementations of this interface must close the provided
     *   {@link Reader} object after parsing.
     * </p>
     *
     * @param reader a {@code Reader} on the document.
     * @return the {@link org.attoparser.dom.Document} object resulting from parsing.
     * @throws ParseException if the document cannot be parsed.
     */
    Document parse(Reader reader)
            throws ParseException;


    /**
     * Parses a named document supplied as a {@code String} and converts it
     * into a DOM tree made of classes from the {@code org.attoparser.dom}
     * package.
     *
     * @param documentName the name of the document to be parsed.
     * @param document the document to be parsed, as a {@code String}.
     * @return the {@link org.attoparser.dom.Document} object resulting from parsing.
     * @throws ParseException if the document cannot be parsed.
     */
    Document parse(String documentName, String document)
            throws ParseException;


    /**
     * Parses a named document supplied as a {@code char[]} and converts it
     * into a DOM tree made of classes from the {@code org.attoparser.dom}
     * package.
     *
     * @param documentName the name of the document to be parsed.
     * @param document the document to be parsed, as a {@code char[]}.
     * @return the {@link org.attoparser.dom.Document} object resulting from parsing.
     * @throws ParseException if the document cannot be parsed.
     */
    Document parse(String documentName, char[] document)
            throws ParseException;


    /**
     * Parses a named document stored in a section of a {@code char[]} and
     * converts it into a DOM tree made of classes from the
     * {@code org.attoparser.dom} package.
     *
     * @param documentName the name of the document to be parsed.
     * @param document the document to be parsed, as a {@code char[]}.
     * @param offset the offset to be applied on the {@code char[]} document to
     *               determine the start of the document contents.
     * @param len the length (in chars) of the document stored in the {@code char[]}.
     * @return the {@link org.attoparser.dom.Document} object resulting from parsing.
     * @throws ParseException if the document cannot be parsed.
     */
    Document parse(String documentName, char[] document, int offset, int len)
            throws ParseException;


    /**
     * Parses a named document read from a {@link Reader} and converts it into
     * a DOM tree made of classes from the {@code org.attoparser.dom} package.
     *
     * <p>
     *   Implementations of this interface must close the provided
     *   {@link Reader} object after parsing.
     * </p>
     *
     * @param documentName the name of the document to be parsed.
     * @param reader a {@code Reader} on the document.
     * @return the {@link org.attoparser.dom.Document} object resulting from parsing.
     * @throws ParseException if the document cannot be parsed.
     */
    Document parse(String documentName, Reader reader)
            throws ParseException;


}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy