All downloads are free. Search and download functionality uses the official Maven repository.

it.unipi.di.acube.batframework.datasetPlugins.ConllAidaTestADataset Maven / Gradle / Ivy

There is a newer version: 1.3.6
Show newest version
package it.unipi.di.acube.batframework.datasetPlugins;

import it.unipi.di.acube.batframework.data.*;
import it.unipi.di.acube.batframework.utils.*;

import java.io.IOException;
import java.util.*;

import javax.xml.parsers.ParserConfigurationException;
import javax.xml.xpath.XPathExpressionException;

import org.xml.sax.SAXException;

public class ConllAidaTestADataset extends ConllAidaDataset{
	private static final int FIRST_DOC_ID = 947;
	private static final int LAST_DOC_ID = 1162;

	public ConllAidaTestADataset(String file, WikipediaApiInterface api) throws IOException, AnnotationException, XPathExpressionException, ParserConfigurationException, SAXException {
		super(file, api);
	}

	@Override
	public int getSize() {
		return LAST_DOC_ID-FIRST_DOC_ID+1;
	}

	@Override
	public int getTagsCount() {
		int count = 0;
		for (HashSet s : getA2WGoldStandardList())
			count += s.size();
		return count;
	}

	@Override
	public List> getC2WGoldStandardList() {
		return ProblemReduction.A2WToC2WList(getA2WGoldStandardList());
	}

	@Override
	public List> getA2WGoldStandardList() {
		return super.getA2WGoldStandardList().subList(FIRST_DOC_ID-1, LAST_DOC_ID);
	}

	@Override
	public List> getD2WGoldStandardList() {
		return getA2WGoldStandardList();
	}

	@Override
	public List getTextInstanceList() {
		return super.getTextInstanceList().subList(FIRST_DOC_ID-1, LAST_DOC_ID);
	}
	
	@Override
	public List> getMentionsInstanceList() {
		return ProblemReduction.A2WToD2WMentionsInstance(getA2WGoldStandardList());
	}

	@Override
	public String getName() {
		return "AIDA/CO-NLL-TestB";
	}

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy