All downloads are free. Search and download functionality uses the official Maven repository.

jvntextpro.data.TaggingData Maven / Gradle / Ivy

Go to download

HeidelTime is a multilingual cross-domain temporal tagger that extracts temporal expressions from documents and normalizes them according to the TIMEX3 annotation standard.

There is a newer version: 2.2.1
Show newest version
/*
 Copyright (C) 2010 by
 * 
 * 	Cam-Tu Nguyen 
 *  [email protected] or [email protected]
 *
 *  Xuan-Hieu Phan  
 *  [email protected] 
 *
 *  College of Technology, Vietnamese University, Hanoi
 * 	Graduate School of Information Sciences, Tohoku University
 *
 * JVnTextPro-v.2.0 is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published
 * by the Free Software Foundation; either version 2 of the License,
 * or (at your option) any later version.
 *
 * JVnTextPro-v.2.0 is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with JVnTextPro-v.2.0; if not, write to the Free Software Foundation,
 * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA.
 */

package jvntextpro.data;

import java.util.ArrayList;

/**
 * Holds a list of {@link ContextGenerator}s and merges the context strings
 * they produce for a given word position of a {@link Sentence}.
 *
 * <p>Generators are queried in the order in which they appear in the list.
 * Context entries that are {@code null} or contain only whitespace are
 * dropped from the merged result.
 */
public class TaggingData {
	
	/** The context generators queried by this object, in query order. */
	protected ArrayList<ContextGenerator> cntxGenVector = null;
	
	/**
	 * Creates a tagging data object with no context generators.
	 */
	public TaggingData(){
		cntxGenVector = new ArrayList<ContextGenerator>();
	}

	/**
	 * Creates a tagging data object backed by the given list of generators.
	 *
	 * <p>The list is stored by reference, not copied, so later changes to it
	 * are visible to this object.
	 *
	 * @param _cntxGenVector the context generators to use; {@code null} is
	 *        treated as an empty list
	 */
	public TaggingData(ArrayList<ContextGenerator> _cntxGenVector){
		// Fall back to an empty list so the other methods never dereference null.
		cntxGenVector = (_cntxGenVector != null)
				? _cntxGenVector
				: new ArrayList<ContextGenerator>();
	}
	
	/**
	 * Creates a tagging data object holding a single context generator.
	 *
	 * @param cntxGen the initial context generator
	 */
	public TaggingData(ContextGenerator cntxGen){
		cntxGenVector = new ArrayList<ContextGenerator>();
		cntxGenVector.add(cntxGen);
	}
	
	/**
	 * Appends a context generator to the end of the generator list.
	 *
	 * @param cntxGen the context generator to add
	 */
	public void addContextGenerator(ContextGenerator cntxGen){
		cntxGenVector.add(cntxGen);
	}
	
	/**
	 * Collects the context strings produced by all generators for one word.
	 *
	 * @param sent the sentence passed to each generator
	 * @param wordIdx the word index passed to each generator
	 * @return the non-blank context strings of all generators, in generator
	 *         order; an empty array if there are none
	 */
	public String [] getContext (Sentence sent, int wordIdx){
		ArrayList<String> collected = collectContext(sent, wordIdx);
		return collected.toArray(new String[collected.size()]);
	}
	
	/**
	 * Collects the context strings produced by all generators for one word
	 * and joins them into a single string.
	 *
	 * @param sent the sentence passed to each generator
	 * @param wordIdx the word index passed to each generator
	 * @return the non-blank context strings separated by single spaces, with
	 *         leading and trailing whitespace trimmed; the empty string if
	 *         there are none
	 */
	public String getContextStr(Sentence sent, int wordIdx){
		// StringBuilder avoids re-copying the accumulated text on every append.
		StringBuilder joined = new StringBuilder();
		
		for (String entry : collectContext(sent, wordIdx)){
			joined.append(entry).append(' ');
		}
		
		return joined.toString().trim();
	}
	
	/**
	 * Queries every generator and gathers the usable context strings.
	 *
	 * @param sent the sentence passed to each generator
	 * @param wordIdx the word index passed to each generator
	 * @return the non-null, non-blank context strings in generator order
	 */
	private ArrayList<String> collectContext(Sentence sent, int wordIdx){
		ArrayList<String> collected = new ArrayList<String>();
		
		for (ContextGenerator generator : cntxGenVector){
			String [] context = generator.getContext(sent, wordIdx);
			if (context == null){
				// This generator has nothing to contribute at this position.
				continue;
			}
			for (String entry : context){
				if (entry == null || entry.trim().equals("")){
					continue;
				}
				collected.add(entry);
			}
		}
		
		return collected;
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy