All Downloads are FREE. Search and download functionalities are using the official Maven repository.

edu.emory.mathcs.nlp.common.verbnet.VNLib Maven / Gradle / Ivy

The newest version!
/**
 * Copyright 2015, Emory University
 * 
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 * 
 *     http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package edu.emory.mathcs.nlp.common.verbnet;

import java.io.BufferedInputStream;
import java.io.FileInputStream;
import java.io.InputStream;
import java.util.List;

import org.w3c.dom.Element;
import org.w3c.dom.NodeList;

import edu.emory.mathcs.nlp.common.util.FileUtils;
import edu.emory.mathcs.nlp.common.util.XMLUtils;

/**
 * @author Jinho D. Choi ({@code [email protected]})
 */
public class VNLib
{
	private VNLib() {}
	
	/**
	 * @param dirPath a directory containing VerbNet XML files.
	 * @param discardNoFrame if {@code true}, discard classes with no frames.
	 */
	static public VNMap getVerbNetMap(String dirPath, boolean discardNoFrame)
	{
		List filelist = FileUtils.getFileList(dirPath, ".xml", false);
		VNMap map = new VNMap();
		InputStream in;
		
		try
		{
			for (String filename : filelist)
			{
				in = new BufferedInputStream(new FileInputStream(filename));
				putVerbNetClasses(in, map, discardNoFrame);
			}
		}
		catch (Exception e) {e.printStackTrace();}
		
		return map;
	}
	
	/** Called by {@link #getVerbNetMap(String)}. */
	static private void putVerbNetClasses(InputStream in, VNMap map, boolean discardNoFrame)
	{
		Element eVNClass = XMLUtils.getDocumentElement(in);
		NodeList list = eVNClass.getElementsByTagName(VNXml.E_VNSUBCLASS);
		int i, size = list.getLength();
		VNClass vn; 
		
		vn = new VNClass(eVNClass);
		if (discardNoFrame && vn.getFrameSize() > 0) map.put(vn);
		
		for (i=0; i 0) map.put(vn);
		}
	}
	
	static public String stripVerbNetClassName(String vncls)
	{
		if (vncls.startsWith(","))	vncls = vncls.substring(1);
		if (vncls.endsWith(",")) 	vncls = vncls.substring(0, vncls.length()-1);
		
		if (!Character.isDigit(vncls.charAt(0)))
		{
			int idx = vncls.indexOf('-');
			if (0 < idx && idx+1 < vncls.length()) vncls = vncls.substring(idx+1);	
		}
		
		return vncls.trim();
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy