// simplenlg.format.english.MarkupRealiser (Maven / Gradle / Ivy)
package simplenlg.format.english;
/*
* The contents of this file are subject to the Mozilla Public License
* Version 1.1 (the "License"); you may not use this file except in
* compliance with the License. You may obtain a copy of the License at
* http://www.mozilla.org/MPL/
*
* Software distributed under the License is distributed on an "AS IS"
* basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See the
* License for the specific language governing rights and limitations
* under the License.
*
* The Original Code is "Simplenlg".
*
* The Initial Developer of the Original Code is Ehud Reiter, Albert Gatt and Dave Westwater.
* Portions created by Ehud Reiter, Albert Gatt and Dave Westwater are Copyright (C) 2010-11 The University of Aberdeen. All Rights Reserved.
*
* Contributor(s): Ehud Reiter, Albert Gatt, Dave Westwater, Roman Kutlak, Margaret Mitchell.
*/
import java.util.ArrayList;
import java.util.List;
import simplenlg.format.english.TextFormatter;
import simplenlg.framework.DocumentCategory;
import simplenlg.framework.DocumentElement;
import simplenlg.framework.NLGElement;
import simplenlg.framework.NLGModule;
import simplenlg.lexicon.Lexicon;
import simplenlg.morphology.english.MorphologyProcessor;
import simplenlg.orthography.english.OrthographyProcessor;
import simplenlg.realiser.english.Realiser;
import simplenlg.syntax.english.SyntaxProcessor;
import static simplenlg.format.english.MarkupMorphologyProcessor.propagateMarkup;
/**
* @author D. Westwater, Data2Text Ltd
*
*/
public class MarkupRealiser extends Realiser {
public MorphologyProcessor morphology;
public OrthographyProcessor orthography;
public SyntaxProcessor syntax;
private NLGModule formatter = null;
private boolean debug = false;
/**
* create a realiser (no lexicon)
*/
public MarkupRealiser() {
super();
initialise();
}
/**
* Create a realiser with a lexicon (should match lexicon used for
* NLGFactory)
*
* @param lexicon
*/
public MarkupRealiser(Lexicon lexicon) {
this();
setLexicon(lexicon);
}
/**
* Check whether this processor separates premodifiers using a comma.
*
*
* Implementation note: this method checks whether the
* {simplenlg.orthography.english.OrthographyProcessor} has the
* parameter set.
*
* @return true
if premodifiers in the noun phrase are
* comma-separated.
*/
public boolean isCommaSepPremodifiers() {
return this.orthography == null ? false : this.orthography.isCommaSepPremodifiers();
}
/**
* Set whether to separate premodifiers using a comma. If true
,
* premodifiers will be comma-separated, as in the long, dark road.
* If false
, they won't.
* Implementation note:: this method sets the relevant
* parameter in the
* { simplenlg.orthography.english.OrthographyProcessor}.
*
* @param commaSepPremodifiers
* the commaSepPremodifiers to set
*/
public void setCommaSepPremodifiers(boolean commaSepPremodifiers) {
if(this.orthography != null) {
this.orthography.setCommaSepPremodifiers(commaSepPremodifiers);
}
}
/**
* Check whether this processor separates cue phrases from the matrix clause using a comma.
*
*
* Implementation note: this method checks whether the
* { simplenlg.orthography.english.OrthographyProcessor} has the
* parameter set.
*
* @return true
if cue phrases have a comma before the remainder of the host phrase
*/
public boolean isCommaSepCuephrase() {
return this.orthography == null ? false : this.orthography.isCommaSepCuephrase();
}
/**
* Set whether to separate cue phrases from the host phrase using a comma. If true
,
* a comma will be inserted, as in however, Bill arrived late.
* If false
, they won't.
* Implementation note:: this method sets the relevant
* parameter in the
* { simplenlg.orthography.english.OrthographyProcessor}.
*
* @param commaSepCuephrase
*/
public void setCommaSepCuephrase(boolean commaSepCuephrase) {
if(this.orthography != null) {
this.orthography.setCommaSepCuephrase(commaSepCuephrase);
}
}
@Override
public void initialise() {
this.morphology = new MorphologyProcessor();
this.morphology.initialise();
this.orthography = new OrthographyProcessor();
this.orthography.initialise();
this.syntax = new SyntaxProcessor();
this.syntax.initialise();
this.formatter = new TextFormatter();
// AG: added call to initialise for formatter
this.formatter.initialise();
}
@Override
public NLGElement realise(NLGElement element) {
StringBuilder debug = new StringBuilder();
if(this.debug) {
System.out.println("INITIAL TREE\n"); //$NON-NLS-1$
System.out.println(element.printTree(null));
debug.append("INITIAL TREE
");
debug.append(element.printTree(" ").replaceAll("\n", "
"));
}
NLGElement postSyntax = this.syntax.realise(element);
if(this.debug) {
System.out.println("
POST-SYNTAX TREE
"); //$NON-NLS-1$
System.out.println(postSyntax.printTree(null));
debug.append("
POST-SYNTAX TREE
");
debug.append(postSyntax.printTree(" ").replaceAll("\n", "
"));
}
NLGElement postMorphology = this.morphology.realise(postSyntax);
if(this.debug) {
System.out.println("\nPOST-MORPHOLOGY TREE\n"); //$NON-NLS-1$
System.out.println(postMorphology.printTree(null));
debug.append("
POST-MORPHOLOGY TREE
");
debug.append(postMorphology.printTree(" ").replaceAll("\n", "
"));
}
NLGElement postOrthography = this.orthography.realise(postMorphology);
if(this.debug) {
System.out.println("\nPOST-ORTHOGRAPHY TREE\n"); //$NON-NLS-1$
System.out.println(postOrthography.printTree(null));
debug.append("
POST-ORTHOGRAPHY TREE
");
debug.append(postOrthography.printTree(" ").replaceAll("\n", "
"));
}
NLGElement postFormatter = null;
if(this.formatter != null) {
postFormatter = this.formatter.realise(postOrthography);
if(this.debug) {
System.out.println("\nPOST-FORMATTER TREE\n"); //$NON-NLS-1$
System.out.println(postFormatter.printTree(null));
debug.append("
POST-FORMATTER TREE
");
debug.append(postFormatter.printTree(" ").replaceAll("\n", "
"));
}
} else {
postFormatter = postOrthography;
}
if(this.debug) {
postFormatter.setFeature("debug", debug.toString());
}
return postFormatter;
}
/**
* Convenience class to realise any NLGElement as a sentence
*
* @param element
* @return String realisation of the NLGElement
*/
public String realiseSentence(NLGElement element) {
NLGElement realised = null;
if(element instanceof DocumentElement)
realised = realise(element);
else {
DocumentElement sentence = new DocumentElement(DocumentCategory.SENTENCE, null);
sentence.addComponent(element);
propagateMarkup(element, sentence);
realised = realise(sentence);
}
if(realised == null)
return null;
else
return realised.getRealisation();
}
@Override
public List realise(List elements) {
List realisedElements = new ArrayList();
if(null != elements) {
for(NLGElement element : elements) {
NLGElement realisedElement = realise(element);
realisedElements.add(realisedElement);
}
}
return realisedElements;
}
@Override
public void setLexicon(Lexicon newLexicon) {
this.syntax.setLexicon(newLexicon);
this.morphology.setLexicon(newLexicon);
this.orthography.setLexicon(newLexicon);
}
public void setFormatter(NLGModule formatter) {
this.formatter = formatter;
}
public void setDebugMode(boolean debugOn) {
this.debug = debugOn;
}
}