org.apache.abdera.parser.stax.FOMParser Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. The ASF licenses this file to You
* under the Apache License, Version 2.0 (the "License"); you may not
* use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License. For additional information regarding
* copyright in this work, please see the NOTICE file in the top level
* directory of this distribution.
*/
package org.apache.abdera.parser.stax;
import java.io.InputStream;
import java.io.Reader;
import javax.xml.stream.XMLInputFactory;
import javax.xml.stream.XMLStreamException;
import javax.xml.stream.XMLStreamReader;
import org.apache.abdera.Abdera;
import org.apache.abdera.factory.Factory;
import org.apache.abdera.i18n.iri.IRI;
import org.apache.abdera.i18n.text.Localizer;
import org.apache.abdera.i18n.text.io.CompressionUtil;
import org.apache.abdera.model.Document;
import org.apache.abdera.model.Element;
import org.apache.abdera.parser.ParseException;
import org.apache.abdera.parser.Parser;
import org.apache.abdera.parser.ParserOptions;
import org.apache.abdera.parser.stax.util.FOMSniffingInputStream;
import org.apache.abdera.parser.stax.util.FOMXmlRestrictedCharReader;
import org.apache.abdera.util.AbstractParser;
import org.apache.axiom.om.OMDocument;
import org.apache.axiom.om.util.StAXParserConfiguration;
import org.apache.axiom.om.util.StAXUtils;
import org.apache.axiom.util.stax.dialect.StAXDialect;
public class FOMParser extends AbstractParser implements Parser {
private static final StAXParserConfiguration ABDERA_PARSER_CONFIGURATION = new StAXParserConfiguration() {
public XMLInputFactory configure(XMLInputFactory factory, StAXDialect dialect) {
factory.setProperty(XMLInputFactory.IS_REPLACING_ENTITY_REFERENCES, Boolean.FALSE);
return factory;
}
// This is used in log statements inside Axiom
@Override
public String toString() {
return "ABDERA";
}
};
public FOMParser() {
super();
}
public FOMParser(Abdera abdera) {
super(abdera);
}
private FOMFactory getFomFactory(ParserOptions options) {
FOMFactory factory =
(options != null && options.getFactory() != null) ? (FOMFactory)options.getFactory() : null;
if (factory == null) {
Factory f = getFactory();
factory = (f instanceof FOMFactory) ? (FOMFactory)f : new FOMFactory();
}
return factory;
}
private Document getDocument(FOMBuilder builder, IRI base, ParserOptions options)
throws ParseException {
Document document = builder.getFomDocument();
try {
if (base != null)
document.setBaseUri(base.toString());
if (options != null && options.getCharset() != null)
((OMDocument)document).setCharsetEncoding(options.getCharset());
if (options != null)
document.setMustPreserveWhitespace(options.getMustPreserveWhitespace());
} catch (Exception e) {
if (!(e instanceof ParseException))
e = new ParseException(e);
throw (ParseException)e;
}
return document;
}
public Document parse(InputStream in, String base, ParserOptions options)
throws ParseException {
if (in == null)
throw new IllegalArgumentException(Localizer.get("INPUTSTREAM.NOT.NULL"));
try {
if (options == null)
options = getDefaultParserOptions();
if (options.getCompressionCodecs() != null) {
in = CompressionUtil.getDecodingInputStream(in, options.getCompressionCodecs());
}
String charset = options.getCharset();
if (charset == null && options.getAutodetectCharset()) {
FOMSniffingInputStream sin =
(in instanceof FOMSniffingInputStream) ? (FOMSniffingInputStream)in
: new FOMSniffingInputStream(in);
charset = sin.getEncoding();
if (charset != null)
options.setCharset(charset);
in = sin;
}
if (options.getFilterRestrictedCharacters()) {
Reader rdr =
(charset == null)
? new FOMXmlRestrictedCharReader(in, options.getFilterRestrictedCharacterReplacement())
: new FOMXmlRestrictedCharReader(in, charset, options.getFilterRestrictedCharacterReplacement());
return parse(StAXUtils.createXMLStreamReader(rdr), base, options);
} else {
XMLStreamReader xmlreader =
(charset == null) ? createXMLStreamReader(in) : createXMLStreamReader(in, charset);
return parse(xmlreader, base, options);
}
} catch (Exception e) {
if (!(e instanceof ParseException))
e = new ParseException(e);
throw (ParseException)e;
}
}
public Document parse(Reader in, String base, ParserOptions options) throws ParseException {
if (in == null)
throw new IllegalArgumentException(Localizer.get("READER.NOT.NULL"));
try {
if (options == null)
options = getDefaultParserOptions();
if (options.getFilterRestrictedCharacters() && !(in instanceof FOMXmlRestrictedCharReader)) {
in = new FOMXmlRestrictedCharReader(in, options.getFilterRestrictedCharacterReplacement());
}
// return parse(StAXUtils.createXMLStreamReader(in), base, options);
return parse(createXMLStreamReader(in), base, options);
} catch (Exception e) {
if (!(e instanceof ParseException))
e = new ParseException(e);
throw (ParseException)e;
}
}
public static XMLStreamReader createXMLStreamReader(InputStream in, String encoding) throws XMLStreamException {
return StAXUtils.createXMLStreamReader(ABDERA_PARSER_CONFIGURATION, in, encoding);
}
public static XMLStreamReader createXMLStreamReader(InputStream in) throws XMLStreamException {
return StAXUtils.createXMLStreamReader(ABDERA_PARSER_CONFIGURATION, in);
}
private XMLStreamReader createXMLStreamReader(Reader in) throws XMLStreamException {
return StAXUtils.createXMLStreamReader(ABDERA_PARSER_CONFIGURATION, in);
}
public Document parse(XMLStreamReader reader, String base, ParserOptions options)
throws ParseException {
try {
FOMBuilder builder = new FOMBuilder(getFomFactory(options), reader, options);
return getDocument(builder, base != null ? new IRI(base) : null, options);
} catch (Exception e) {
if (!(e instanceof ParseException))
e = new ParseException(e);
throw (ParseException)e;
}
}
@Override
protected ParserOptions initDefaultParserOptions() {
return new FOMParserOptions(getFactory());
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy