// jvnpostag.POSTrainGenerating Maven / Gradle / Ivy
/*
Copyright (C) 2010 by
*
* Cam-Tu Nguyen
* [email protected] or [email protected]
*
* Xuan-Hieu Phan
* [email protected]
*
* College of Technology, Vietnamese University, Hanoi
* Graduate School of Information Sciences, Tohoku University
*
* JVnTextPro-v.2.0 is a free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published
* by the Free Software Foundation; either version 2 of the License,
* or (at your option) any later version.
*
* JVnTextPro-v.2.0 is distributed in the hope that it will be useful, but
* WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with JVnTextPro-v.2.0; if not, write to the Free Software Foundation,
* Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA.
*/
package jvnpostag;
import jvntextpro.data.TaggingData;
import jvntextpro.data.TrainDataGenerating;
/**
 * Generates training data for part-of-speech (POS) tagging.
 *
 * <p>This class fills in the {@code reader} and {@code tagger} members it inherits with a
 * {@link POSDataReader} and a {@link TaggingData} whose context predicates come from a
 * {@link POSContextGenerator} built from a feature template file. The actual generation is
 * done by the inherited {@code generateTrainData} method.
 */
public class POSTrainGenerating extends TrainDataGenerating {

    /** Path of the feature template file handed to {@link POSContextGenerator}. */
    String templateFile;

    /**
     * Creates a POS training-data generator and initializes it via {@link #init()}.
     *
     * @param templateFile the template file (in xml format) to generate context predicates
     *                     using POSContextGenerator
     */
    public POSTrainGenerating(String templateFile) {
        // The template path must be stored before init() runs, because init() reads it.
        this.templateFile = templateFile;
        // NOTE(review): init() is public and overridable yet is invoked during construction;
        // a subclass overriding it would run before its own fields are initialized.
        init();
    }

    /* (non-Javadoc)
     * @see jvntextpro.data.TrainDataGenerating#init()
     */
    @Override
    public void init() {
        // NOTE(review): the 'true' flag presumably selects training-mode reading — confirm
        // against POSDataReader's constructor.
        this.reader = new POSDataReader(true);
        this.tagger = new TaggingData();
        tagger.addContextGenerator(new POSContextGenerator(templateFile));
    }

    /**
     * Command-line entry point.
     *
     * <p>Expects exactly two arguments: the feature template file and the file/folder holding
     * the manually tagged data. With any other argument count, a usage message is printed to
     * standard output and the method returns without doing any work.
     *
     * @param args {@code args[0]} is the template file, {@code args[1]} is the input file/folder
     */
    public static void main(String[] args) {
        if (args.length != 2) {
            System.out.println("POSTrainGenerating [template File] [File/Folder]");
            // This tool produces POS-tagging training data, so the usage text says so.
            System.out.println("Generating training data for POS tagging with FlexCRFs++ or jvnmaxent (in JVnTextPro)");
            System.out.println("Template File: featuretemplate to generate context predicates");
            System.out.println("Input File/Folder: file/folder name containing data manually tagged for training");
            return;
        }

        POSTrainGenerating trainGen = new POSTrainGenerating(args[0]);
        // The same path is passed as both input and output location; how the output name is
        // derived from it is decided by TrainDataGenerating#generateTrainData.
        trainGen.generateTrainData(args[1], args[1]);
    }
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy