// opennlp.tools.parser.ParserEvaluator Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package opennlp.tools.parser;
import java.util.ArrayList;
import java.util.List;
import java.util.Stack;
import opennlp.tools.cmdline.parser.ParserTool;
import opennlp.tools.util.Span;
import opennlp.tools.util.eval.Evaluator;
import opennlp.tools.util.eval.FMeasure;
/**
* This implementation of {@link Evaluator} behaves like {@code EVALB} with no exceptions,
* e.g., without removing punctuation tags or treating {@code ADVP} and {@code PRT} as equal,
* as in the COLLINS convention.
* <p>
* To follow parsing evaluation conventions (Bikel, Collins, Charniak, etc.) as in {@code EVALB},
* options are to be added to the {@code ParserEvaluatorTool}.
*
* @see Parser
* @see Evaluator
* @see Parse
*/
public class ParserEvaluator extends Evaluator<Parse> {

  /**
   * Collects the scores; it is updated by every call to
   * {@link #processSample(Parse)} for which the parser produced a prediction.
   */
  private final FMeasure fmeasure = new FMeasure();

  /**
   * The parser to evaluate.
   */
  private final Parser parser;

  /**
   * Initializes a {@link ParserEvaluator} instance with the given {@link Parser}.
   *
   * @param aParser The {@link Parser} to evaluate.
   * @param monitors The {@link ParserEvaluationMonitor evaluation listeners}.
   */
  public ParserEvaluator(final Parser aParser, final ParserEvaluationMonitor... monitors) {
    super(monitors);
    this.parser = aParser;
  }

  /**
   * Collects a typed {@link Span} for every constituent below the root of a parse.
   * <p>
   * The root node itself is not reported; only its descendants are visited.
   * Nodes that are POS tags are skipped, and their children are not visited.
   *
   * @param parse The parse from which to obtain {@link Span spans}.
   *
   * @return An array of {@link Span spans}, one per visited non-POS-tag node,
   *         each carrying the node's start, end and type. Empty if there are none.
   */
  private static Span[] getConstituencySpans(final Parse parse) {
    // Explicit stack instead of recursion; seeded with the root's direct children.
    Stack<Parse> stack = new Stack<>();
    if (parse.getChildCount() > 0) {
      for (Parse child : parse.getChildren()) {
        stack.push(child);
      }
    }

    List<Span> consts = new ArrayList<>();
    while (!stack.isEmpty()) {
      Parse constSpan = stack.pop();
      if (!constSpan.isPosTag()) {
        Span span = constSpan.getSpan();
        // Re-create the span with the constituent label as its type.
        consts.add(new Span(span.getStart(), span.getEnd(), constSpan.getType()));
        for (Parse child : constSpan.getChildren()) {
          stack.push(child);
        }
      }
    }
    return consts.toArray(new Span[0]);
  }

  /**
   * Re-parses the tokens of the reference parse and scores the result.
   * <p>
   * The covered text of every token node of {@code reference} is joined with
   * single spaces and handed to {@link ParserTool#parseLine} together with the
   * parser under evaluation, requesting one parse. If at least one parse is
   * returned, the constituency spans of the reference and of the first
   * prediction are passed to the {@link FMeasure}.
   *
   * @param reference The reference {@link Parse} to evaluate against.
   *
   * @return The first predicted {@link Parse}, or {@code null} if the parser
   *         returned no parse. In that case the scores are left untouched.
   */
  @Override
  protected final Parse processSample(final Parse reference) {
    List<String> tokens = new ArrayList<>();
    for (Parse token : reference.getTokenNodes()) {
      tokens.add(token.getSpan().getCoveredText(reference.getText()).toString());
    }

    Parse[] predictions = ParserTool.parseLine(String.join(" ", tokens), parser, 1);
    Parse prediction = null;
    if (predictions.length > 0) {
      prediction = predictions[0];
      fmeasure.updateScores(getConstituencySpans(reference), getConstituencySpans(prediction));
    }
    return prediction;
  }

  /**
   * Returns the {@link FMeasure} updated by this evaluator.
   *
   * @return The {@link FMeasure} instance; never {@code null}.
   */
  public final FMeasure getFMeasure() {
    return fmeasure;
  }
}