All Downloads are FREE. Search and download functionalities are using the official Maven repository.

simplenlg.format.english.MarkupRealiser Maven / Gradle / Ivy

There is a newer version: 2.2.0
Show newest version
package simplenlg.format.english;

/*
 * The contents of this file are subject to the Mozilla Public License
 * Version 1.1 (the "License"); you may not use this file except in
 * compliance with the License. You may obtain a copy of the License at
 * http://www.mozilla.org/MPL/
 *
 * Software distributed under the License is distributed on an "AS IS"
 * basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See the
 * License for the specific language governing rights and limitations
 * under the License.
 *
 * The Original Code is "Simplenlg".
 *
 * The Initial Developer of the Original Code is Ehud Reiter, Albert Gatt and Dave Westwater.
 * Portions created by Ehud Reiter, Albert Gatt and Dave Westwater are Copyright (C) 2010-11 The University of Aberdeen. All Rights Reserved.
 *
 * Contributor(s): Ehud Reiter, Albert Gatt,4 Dave Wewstwater, Roman Kutlak, Margaret Mitchell.
 */

import java.util.ArrayList;
import java.util.List;

import simplenlg.format.english.TextFormatter;
import simplenlg.framework.DocumentCategory;
import simplenlg.framework.DocumentElement;
import simplenlg.framework.NLGElement;
import simplenlg.framework.NLGModule;
import simplenlg.lexicon.Lexicon;
import simplenlg.morphology.english.MorphologyProcessor;
import simplenlg.orthography.english.OrthographyProcessor;
import simplenlg.realiser.english.Realiser;
import simplenlg.syntax.english.SyntaxProcessor;

import static simplenlg.format.english.MarkupMorphologyProcessor.propagateMarkup;

/**
 * @author D. Westwater, Data2Text Ltd
 *
 */
public class MarkupRealiser extends Realiser {

    public MorphologyProcessor  morphology;
    public OrthographyProcessor orthography;
    public SyntaxProcessor      syntax;
    private NLGModule            formatter = null;
    private boolean              debug     = false;

    /**
     * create a realiser (no lexicon)
     */
    public MarkupRealiser() {
        super();
        initialise();
    }

    /**
     * Create a realiser with a lexicon (should match lexicon used for
     * NLGFactory)
     *
     * @param lexicon
     */
    public MarkupRealiser(Lexicon lexicon) {
        this();
        setLexicon(lexicon);
    }

    /**
     * Check whether this processor separates premodifiers using a comma.
     *
     * 
* Implementation note: this method checks whether the * {simplenlg.orthography.english.OrthographyProcessor} has the * parameter set. * * @return true if premodifiers in the noun phrase are * comma-separated. */ public boolean isCommaSepPremodifiers() { return this.orthography == null ? false : this.orthography.isCommaSepPremodifiers(); } /** * Set whether to separate premodifiers using a comma. If true, * premodifiers will be comma-separated, as in the long, dark road. * If false, they won't.
* Implementation note:: this method sets the relevant * parameter in the * { simplenlg.orthography.english.OrthographyProcessor}. * * @param commaSepPremodifiers * the commaSepPremodifiers to set */ public void setCommaSepPremodifiers(boolean commaSepPremodifiers) { if(this.orthography != null) { this.orthography.setCommaSepPremodifiers(commaSepPremodifiers); } } /** * Check whether this processor separates cue phrases from the matrix clause using a comma. * *
* Implementation note: this method checks whether the * { simplenlg.orthography.english.OrthographyProcessor} has the * parameter set. * * @return true if cue phrases have a comma before the remainder of the host phrase */ public boolean isCommaSepCuephrase() { return this.orthography == null ? false : this.orthography.isCommaSepCuephrase(); } /** * Set whether to separate cue phrases from the host phrase using a comma. If true, * a comma will be inserted, as in however, Bill arrived late. * If false, they won't.
* Implementation note:: this method sets the relevant * parameter in the * { simplenlg.orthography.english.OrthographyProcessor}. * * @param commaSepCuephrase */ public void setCommaSepCuephrase(boolean commaSepCuephrase) { if(this.orthography != null) { this.orthography.setCommaSepCuephrase(commaSepCuephrase); } } @Override public void initialise() { this.morphology = new MorphologyProcessor(); this.morphology.initialise(); this.orthography = new OrthographyProcessor(); this.orthography.initialise(); this.syntax = new SyntaxProcessor(); this.syntax.initialise(); this.formatter = new TextFormatter(); // AG: added call to initialise for formatter this.formatter.initialise(); } @Override public NLGElement realise(NLGElement element) { StringBuilder debug = new StringBuilder(); if(this.debug) { System.out.println("INITIAL TREE\n"); //$NON-NLS-1$ System.out.println(element.printTree(null)); debug.append("INITIAL TREE
"); debug.append(element.printTree("  ").replaceAll("\n", "
")); } NLGElement postSyntax = this.syntax.realise(element); if(this.debug) { System.out.println("
POST-SYNTAX TREE
"); //$NON-NLS-1$ System.out.println(postSyntax.printTree(null)); debug.append("
POST-SYNTAX TREE
"); debug.append(postSyntax.printTree("  ").replaceAll("\n", "
")); } NLGElement postMorphology = this.morphology.realise(postSyntax); if(this.debug) { System.out.println("\nPOST-MORPHOLOGY TREE\n"); //$NON-NLS-1$ System.out.println(postMorphology.printTree(null)); debug.append("
POST-MORPHOLOGY TREE
"); debug.append(postMorphology.printTree("  ").replaceAll("\n", "
")); } NLGElement postOrthography = this.orthography.realise(postMorphology); if(this.debug) { System.out.println("\nPOST-ORTHOGRAPHY TREE\n"); //$NON-NLS-1$ System.out.println(postOrthography.printTree(null)); debug.append("
POST-ORTHOGRAPHY TREE
"); debug.append(postOrthography.printTree("  ").replaceAll("\n", "
")); } NLGElement postFormatter = null; if(this.formatter != null) { postFormatter = this.formatter.realise(postOrthography); if(this.debug) { System.out.println("\nPOST-FORMATTER TREE\n"); //$NON-NLS-1$ System.out.println(postFormatter.printTree(null)); debug.append("
POST-FORMATTER TREE
"); debug.append(postFormatter.printTree("  ").replaceAll("\n", "
")); } } else { postFormatter = postOrthography; } if(this.debug) { postFormatter.setFeature("debug", debug.toString()); } return postFormatter; } /** * Convenience class to realise any NLGElement as a sentence * * @param element * @return String realisation of the NLGElement */ public String realiseSentence(NLGElement element) { NLGElement realised = null; if(element instanceof DocumentElement) realised = realise(element); else { DocumentElement sentence = new DocumentElement(DocumentCategory.SENTENCE, null); sentence.addComponent(element); propagateMarkup(element, sentence); realised = realise(sentence); } if(realised == null) return null; else return realised.getRealisation(); } @Override public List realise(List elements) { List realisedElements = new ArrayList(); if(null != elements) { for(NLGElement element : elements) { NLGElement realisedElement = realise(element); realisedElements.add(realisedElement); } } return realisedElements; } @Override public void setLexicon(Lexicon newLexicon) { this.syntax.setLexicon(newLexicon); this.morphology.setLexicon(newLexicon); this.orthography.setLexicon(newLexicon); } public void setFormatter(NLGModule formatter) { this.formatter = formatter; } public void setDebugMode(boolean debugOn) { this.debug = debugOn; } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy