All downloads are free. The search and download functionality uses the official Maven repository.

jvnpostag.POSTrainGenerating Maven / Gradle / Ivy

Go to download

HeidelTime is a multilingual cross-domain temporal tagger that extracts temporal expressions from documents and normalizes them according to the TIMEX3 annotation standard.

There is a newer version: 2.2.1
Show newest version
/*
 Copyright (C) 2010 by
 * 
 * 	Cam-Tu Nguyen 
 *  [email protected] or [email protected]
 *
 *  Xuan-Hieu Phan  
 *  [email protected] 
 *
 *  College of Technology, Vietnamese University, Hanoi
 * 	Graduate School of Information Sciences, Tohoku University
 *
 * JVnTextPro-v.2.0 is a free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published
 * by the Free Software Foundation; either version 2 of the License,
 * or (at your option) any later version.
 *
 * JVnTextPro-v.2.0 is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with JVnTextPro-v.2.0; if not, write to the Free Software Foundation,
 * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA.
 */
package jvnpostag;
import jvntextpro.data.TaggingData;
import jvntextpro.data.TrainDataGenerating;

/**
 * Command-line entry point and configuration class that generates training
 * data for part-of-speech (POS) tagging.
 *
 * <p>The class only wires components together: {@link #init()} installs a
 * {@link POSDataReader} as the reader and a {@link TaggingData} instance
 * carrying a {@link POSContextGenerator} as the tagger. The generation itself
 * is done by {@code generateTrainData}, which is not defined in this class
 * (presumably inherited from {@link TrainDataGenerating}).
 */
public class POSTrainGenerating extends TrainDataGenerating {
	
	/** Path of the feature template file passed to {@link POSContextGenerator}. */
	String templateFile;
	
	/**
	 * Creates a generator configured with the given feature template.
	 *
	 * @param templateFile the template file (in xml format) used by
	 * {@link POSContextGenerator} to generate context predicates
	 */
	public POSTrainGenerating(String templateFile){
		// The field must be assigned before init() runs, because init() reads it.
		this.templateFile = templateFile;
		// NOTE(review): init() is overridable and is invoked from the constructor;
		// a subclass overriding it would run before its own fields are initialized.
		init();
	}
	
	/**
	 * Sets up the reader and the tagger used for POS training data generation.
	 *
	 * <p>Replaces any previously assigned reader and tagger with fresh instances
	 * and registers a {@link POSContextGenerator} built from {@link #templateFile}.
	 *
	 * @see jvntextpro.data.TrainDataGenerating#init()
	 */
	@Override
	public void init() {
		// NOTE(review): meaning of the boolean flag is not visible here — confirm in POSDataReader.
		this.reader =  new POSDataReader(true);
		this.tagger = new TaggingData();
		tagger.addContextGenerator(new POSContextGenerator(templateFile));
	}

	/**
	 * Prints the command-line usage to standard output.
	 */
	private static void printUsage(){
		System.out.println("POSTrainGenerating [template File] [File/Folder]");
		// This tool belongs to the POS tagger; the message previously said "word segmentation".
		System.out.println("Generating training data for POS tagging with FlexCRFs++ or jvnmaxent (in JVnTextPro)");
		System.out.println("Template File: featuretemplate to generate context predicates");
		System.out.println("Input File/Folder: file/folder name containing data manually tagged for training");
	}

	/**
	 * Runs the generator from the command line.
	 *
	 * <p>Expects exactly two arguments; with any other argument count the usage
	 * text is printed and the method returns without doing any work.
	 *
	 * @param args {@code args[0]} is the feature template file, {@code args[1]}
	 * is the file or folder containing the manually tagged training data
	 */
	public static void main(String [] args){
		if (args.length != 2){
			printUsage();
			return;
		}
		
		POSTrainGenerating trainGen = new POSTrainGenerating(args[0]);
		// The input path is deliberately passed as both arguments of generateTrainData.
		trainGen.generateTrainData(args[1], args[1]);		
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy