// simplenlg.format.english.MarkupRealiser (Maven / Gradle / Ivy)
//
// Go to download
// Show more of this group / Show more artifacts with this name
// Show all versions of nlg-wrapper / Show documentation
// There is a newer version: 2.2.0
package simplenlg.format.english;

/*
 * The contents of this file are subject to the Mozilla Public License
 * Version 1.1 (the "License"); you may not use this file except in
 * compliance with the License. You may obtain a copy of the License at
 * http://www.mozilla.org/MPL/
 *
 * Software distributed under the License is distributed on an "AS IS"
 * basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See the
 * License for the specific language governing rights and limitations
 * under the License.
 *
 * The Original Code is "Simplenlg".
 *
 * The Initial Developer of the Original Code is Ehud Reiter, Albert Gatt and Dave Westwater.
 * Portions created by Ehud Reiter, Albert Gatt and Dave Westwater are Copyright (C) 2010-11 The University of Aberdeen. All Rights Reserved.
 *
 * Contributor(s): Ehud Reiter, Albert Gatt, Dave Westwater, Roman Kutlak, Margaret Mitchell.
 */

import java.util.ArrayList;
import java.util.List;

import simplenlg.format.english.TextFormatter;
import simplenlg.framework.DocumentCategory;
import simplenlg.framework.DocumentElement;
import simplenlg.framework.NLGElement;
import simplenlg.framework.NLGModule;
import simplenlg.lexicon.Lexicon;
import simplenlg.morphology.english.MorphologyProcessor;
import simplenlg.orthography.english.OrthographyProcessor;
import simplenlg.realiser.english.Realiser;
import simplenlg.syntax.english.SyntaxProcessor;

import static simplenlg.format.english.MarkupMorphologyProcessor.propagateMarkup;

/**
 * @author D. Westwater, Data2Text Ltd
 *
 */
public class MarkupRealiser extends Realiser {

    public MorphologyProcessor  morphology;
    public OrthographyProcessor orthography;
    public SyntaxProcessor      syntax;
    private NLGModule            formatter = null;
    private boolean              debug     = false;

    /**
     * create a realiser (no lexicon)
     */
    public MarkupRealiser() {
        super();
        initialise();
    }

    /**
     * Create a realiser with a lexicon (should match lexicon used for
     * NLGFactory)
     *
     * @param lexicon
     */
    public MarkupRealiser(Lexicon lexicon) {
        this();
        setLexicon(lexicon);
    }

    /**
     * Check whether this processor separates premodifiers using a comma.
     *
     * 

     * Implementation note: this method checks whether the
     * {simplenlg.orthography.english.OrthographyProcessor} has the
     * parameter set.
     *
     * @return true if premodifiers in the noun phrase are
     *         comma-separated.
     */
    public boolean isCommaSepPremodifiers() {
        return this.orthography == null ? false : this.orthography.isCommaSepPremodifiers();
    }

    /**
     * Set whether to separate premodifiers using a comma. If true,
     * premodifiers will be comma-separated, as in the long, dark road.
     * If false, they won't. 

     * Implementation note:: this method sets the relevant
     * parameter in the
     * { simplenlg.orthography.english.OrthographyProcessor}.
     *
     * @param commaSepPremodifiers
     *            the commaSepPremodifiers to set
     */
    public void setCommaSepPremodifiers(boolean commaSepPremodifiers) {
        if(this.orthography != null) {
            this.orthography.setCommaSepPremodifiers(commaSepPremodifiers);
        }
    }

    /**
     * Check whether this processor separates cue phrases from the matrix clause using a comma.
     *
     * 

     * Implementation note: this method checks whether the
     * { simplenlg.orthography.english.OrthographyProcessor} has the
     * parameter set.
     *
     * @return true if cue phrases have a comma before the remainder of the host phrase
     */
    public boolean isCommaSepCuephrase() {
        return this.orthography == null ? false : this.orthography.isCommaSepCuephrase();
    }

    /**
     * Set whether to separate cue phrases from the host phrase using a comma. If true,
     * a comma will be inserted, as in however, Bill arrived late.
     * If false, they won't. 

     * Implementation note:: this method sets the relevant
     * parameter in the
     * { simplenlg.orthography.english.OrthographyProcessor}.
     *
     * @param commaSepCuephrase
     */
    public void setCommaSepCuephrase(boolean commaSepCuephrase) {
        if(this.orthography != null) {
            this.orthography.setCommaSepCuephrase(commaSepCuephrase);
        }
    }

    @Override
    public void initialise() {
        this.morphology = new MorphologyProcessor();
        this.morphology.initialise();
        this.orthography = new OrthographyProcessor();
        this.orthography.initialise();
        this.syntax = new SyntaxProcessor();
        this.syntax.initialise();
        this.formatter = new TextFormatter();
        // AG: added call to initialise for formatter
        this.formatter.initialise();
    }

    @Override
    public NLGElement realise(NLGElement element) {

        StringBuilder debug = new StringBuilder();

        if(this.debug) {
            System.out.println("INITIAL TREE\n"); //$NON-NLS-1$
            System.out.println(element.printTree(null));
            debug.append("INITIAL TREE
");
            debug.append(element.printTree("  ").replaceAll("\n", "
"));
        }

        NLGElement postSyntax = this.syntax.realise(element);
        if(this.debug) {
            System.out.println("
POST-SYNTAX TREE
"); //$NON-NLS-1$
            System.out.println(postSyntax.printTree(null));
            debug.append("
POST-SYNTAX TREE
");
            debug.append(postSyntax.printTree("  ").replaceAll("\n", "
"));
        }

        NLGElement postMorphology = this.morphology.realise(postSyntax);
        if(this.debug) {
            System.out.println("\nPOST-MORPHOLOGY TREE\n"); //$NON-NLS-1$
            System.out.println(postMorphology.printTree(null));
            debug.append("
POST-MORPHOLOGY TREE
");
            debug.append(postMorphology.printTree("  ").replaceAll("\n", "
"));
        }

        NLGElement postOrthography = this.orthography.realise(postMorphology);
        if(this.debug) {
            System.out.println("\nPOST-ORTHOGRAPHY TREE\n"); //$NON-NLS-1$
            System.out.println(postOrthography.printTree(null));
            debug.append("
POST-ORTHOGRAPHY TREE
");
            debug.append(postOrthography.printTree("  ").replaceAll("\n", "
"));
        }

        NLGElement postFormatter = null;
        if(this.formatter != null) {
            postFormatter = this.formatter.realise(postOrthography);
            if(this.debug) {
                System.out.println("\nPOST-FORMATTER TREE\n"); //$NON-NLS-1$
                System.out.println(postFormatter.printTree(null));
                debug.append("
POST-FORMATTER TREE
");
                debug.append(postFormatter.printTree("  ").replaceAll("\n", "
"));
            }

        } else {
            postFormatter = postOrthography;
        }

        if(this.debug) {
            postFormatter.setFeature("debug", debug.toString());
        }

        return postFormatter;
    }

    /**
     * Convenience class to realise any NLGElement as a sentence
     *
     * @param element
     * @return String realisation of the NLGElement
     */
    public String realiseSentence(NLGElement element) {
        NLGElement realised = null;
        if(element instanceof DocumentElement)
            realised = realise(element);
        else {
            DocumentElement sentence = new DocumentElement(DocumentCategory.SENTENCE, null);
            sentence.addComponent(element);
            propagateMarkup(element, sentence);
            realised = realise(sentence);
        }

        if(realised == null)
            return null;
        else
            return realised.getRealisation();
    }

    @Override
    public List realise(List elements) {
        List realisedElements = new ArrayList();
        if(null != elements) {
            for(NLGElement element : elements) {
                NLGElement realisedElement = realise(element);
                realisedElements.add(realisedElement);
            }
        }
        return realisedElements;
    }

    @Override
    public void setLexicon(Lexicon newLexicon) {
        this.syntax.setLexicon(newLexicon);
        this.morphology.setLexicon(newLexicon);
        this.orthography.setLexicon(newLexicon);
    }

    public void setFormatter(NLGModule formatter) {
        this.formatter = formatter;
    }

    public void setDebugMode(boolean debugOn) {
        this.debug = debugOn;
    }
}