org.sweble.wikitext.lazy.LazyParser Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of swc-parser-lazy Show documentation
Show all versions of swc-parser-lazy Show documentation
A parser for MediaWiki's Wikitext.
/**
* Copyright 2011 The Open Source Research Group,
* University of Erlangen-Nürnberg
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.sweble.wikitext.lazy;
import java.io.IOException;
import java.io.Reader;
import java.io.StringReader;
import org.sweble.wikitext.lazy.parser.LazyParsedPage;
import org.sweble.wikitext.lazy.parser.LazyRatsParser;
import org.sweble.wikitext.lazy.preprocessor.PreprocessedWikitext;
import xtc.parser.ParseError;
import xtc.parser.ParseException;
import xtc.parser.Result;
import xtc.parser.SemanticValue;
import de.fau.cs.osr.ptk.common.EntityMap;
import de.fau.cs.osr.ptk.common.ParserCommon;
import de.fau.cs.osr.ptk.common.ast.AstNode;
public class LazyParser
extends
ParserCommon
{
private final ParserConfigInterface config;
private LazyRatsParser parser;
// =========================================================================
public LazyParser(ParserConfigInterface config)
{
this.config = config;
}
// =========================================================================
@Override
public AstNode parseArticle(String src, String title) throws IOException, ParseException
{
PreprocessedWikitext ppWt =
new PreprocessedWikitext(src, new EntityMap());
return parseArticle(ppWt, title);
}
public AstNode parseArticle(PreprocessedWikitext wikitext, String title) throws IOException, ParseException
{
Reader in = new StringReader(wikitext.getWikitext());
int inputSize = wikitext.getWikitext().getBytes().length;
parser = new LazyRatsParser(in, title, inputSize);
parser.getState().init(config, wikitext.getEntityMap());
Result r = null;
//LazyRatsParser.enableStats();
{
r = this.parser.pArticle(0);
}
if (LazyRatsParser.isStatsEnabled())
LazyRatsParser.getStats().dump(System.err);
if (r.hasValue())
{
SemanticValue v = (SemanticValue) r;
if (v.value instanceof LazyParsedPage)
{
return process((LazyParsedPage) v.value);
}
else
{
throw new ParseException(
"Internal parser error: Unexpected parser result type!");
}
}
else
{
ParseError err = (ParseError) r;
if (err.index == -1)
{
throw new ParseException(
"Parse error: No information available");
}
else
{
throw new ParseException(String.format(
"%s: %s",
parser.location(err.index),
err.msg));
}
}
}
}