All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.sweble.wikitext.lazy.LazyParser Maven / Gradle / Ivy

There is a newer version: 3.1.9
Show newest version
/**
 * Copyright 2011 The Open Source Research Group,
 *                University of Erlangen-Nürnberg
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.sweble.wikitext.lazy;

import java.io.IOException;
import java.io.Reader;
import java.io.StringReader;

import org.sweble.wikitext.lazy.parser.LazyParsedPage;
import org.sweble.wikitext.lazy.parser.LazyRatsParser;
import org.sweble.wikitext.lazy.preprocessor.PreprocessedWikitext;

import xtc.parser.ParseError;
import xtc.parser.ParseException;
import xtc.parser.Result;
import xtc.parser.SemanticValue;
import de.fau.cs.osr.ptk.common.EntityMap;
import de.fau.cs.osr.ptk.common.ParserCommon;
import de.fau.cs.osr.ptk.common.ast.AstNode;

public class LazyParser
        extends
            ParserCommon
{
	private final ParserConfigInterface config;
	
	private LazyRatsParser parser;
	
	// =========================================================================
	
	public LazyParser(ParserConfigInterface config)
	{
		this.config = config;
	}
	
	// =========================================================================
	
	@Override
	public AstNode parseArticle(String src, String title) throws IOException, ParseException
	{
		PreprocessedWikitext ppWt =
		        new PreprocessedWikitext(src, new EntityMap());
		
		return parseArticle(ppWt, title);
	}
	
	public AstNode parseArticle(PreprocessedWikitext wikitext, String title) throws IOException, ParseException
	{
		Reader in = new StringReader(wikitext.getWikitext());
		
		int inputSize = wikitext.getWikitext().getBytes().length;
		
		parser = new LazyRatsParser(in, title, inputSize);
		
		parser.getState().init(config, wikitext.getEntityMap());
		
		Result r = null;
		
		//LazyRatsParser.enableStats();
		{
			r = this.parser.pArticle(0);
		}
		if (LazyRatsParser.isStatsEnabled())
			LazyRatsParser.getStats().dump(System.err);
		
		if (r.hasValue())
		{
			SemanticValue v = (SemanticValue) r;
			
			if (v.value instanceof LazyParsedPage)
			{
				return process((LazyParsedPage) v.value);
			}
			else
			{
				throw new ParseException(
				        "Internal parser error: Unexpected parser result type!");
			}
		}
		else
		{
			ParseError err = (ParseError) r;
			
			if (err.index == -1)
			{
				throw new ParseException(
				        "Parse error: No information available");
			}
			else
			{
				throw new ParseException(String.format(
				        "%s: %s",
				        parser.location(err.index),
				        err.msg));
			}
		}
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy