edu.emory.mathcs.nlp.common.verbnet.VNLib Maven / Gradle / Ivy
The newest version!
/**
* Copyright 2015, Emory University
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package edu.emory.mathcs.nlp.common.verbnet;
import java.io.BufferedInputStream;
import java.io.FileInputStream;
import java.io.InputStream;
import java.util.List;
import org.w3c.dom.Element;
import org.w3c.dom.NodeList;
import edu.emory.mathcs.nlp.common.util.FileUtils;
import edu.emory.mathcs.nlp.common.util.XMLUtils;
/**
* @author Jinho D. Choi ({@code jinho.choi@emory.edu})
*/
public class VNLib
{
private VNLib() {}
/**
* @param dirPath a directory containing VerbNet XML files.
* @param discardNoFrame if {@code true}, discard classes with no frames.
*/
static public VNMap getVerbNetMap(String dirPath, boolean discardNoFrame)
{
List filelist = FileUtils.getFileList(dirPath, ".xml", false);
VNMap map = new VNMap();
InputStream in;
try
{
for (String filename : filelist)
{
in = new BufferedInputStream(new FileInputStream(filename));
putVerbNetClasses(in, map, discardNoFrame);
}
}
catch (Exception e) {e.printStackTrace();}
return map;
}
/** Called by {@link #getVerbNetMap(String)}. */
static private void putVerbNetClasses(InputStream in, VNMap map, boolean discardNoFrame)
{
Element eVNClass = XMLUtils.getDocumentElement(in);
NodeList list = eVNClass.getElementsByTagName(VNXml.E_VNSUBCLASS);
int i, size = list.getLength();
VNClass vn;
vn = new VNClass(eVNClass);
if (discardNoFrame && vn.getFrameSize() > 0) map.put(vn);
for (i=0; i 0) map.put(vn);
}
}
static public String stripVerbNetClassName(String vncls)
{
if (vncls.startsWith(",")) vncls = vncls.substring(1);
if (vncls.endsWith(",")) vncls = vncls.substring(0, vncls.length()-1);
if (!Character.isDigit(vncls.charAt(0)))
{
int idx = vncls.indexOf('-');
if (0 < idx && idx+1 < vncls.length()) vncls = vncls.substring(idx+1);
}
return vncls.trim();
}
}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy