All downloads are free. The search and download functionality uses the official Maven repository.

dkpro.similarity.example.ml.Features2Arff Maven / Gradle / Ivy

/**
 * Copyright 2012-2016
 * Ubiquitous Knowledge Processing (UKP) Lab
 * Technische Universität Darmstadt
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see http://www.gnu.org/licenses/.
 */
package dkpro.similarity.example.ml;

import java.io.File;
import java.util.ArrayList;
import java.util.List;

import org.apache.commons.io.FileUtils;

import dkpro.similarity.ml.util.ArffConverter;


/**
 * Command-line utility that converts directories of feature files
 * (<code>.txt</code>) into ARFF strings via {@link ArffConverter} and writes
 * them to <code>src/main/resources/models</code> (relative to the working
 * directory).
 *
 * Two files are produced: one for the SemEval training features (converted
 * together with a gold standard file) and one for the "mm09" features
 * (converted without a gold standard file).
 */
public class Features2Arff
{
	/** Default location of the example project; machine-specific, override via args[0]. */
	private static final String DEFAULT_FEATURES_BASE_PATH = "/home/danielb/Projekte/Similarity/workspace/de.tudarmstadt.ukp.similarity-asl/de.tudarmstadt.ukp.similarity.example";

	/** Default location of the data project; machine-specific, override via args[1]. */
	private static final String DEFAULT_GOLD_BASE_PATH = "/home/danielb/Projekte/Similarity/workspace/de.tudarmstadt.ukp.similarity-asl/de.tudarmstadt.ukp.similarity.dkpro.data-asl";

	/**
	 * Runs both conversions.
	 *
	 * @param args optional; <code>args[0]</code> overrides the base path of the
	 *             project containing the feature directories, <code>args[1]</code>
	 *             overrides the base path of the project containing the gold
	 *             standard. Missing arguments fall back to the built-in defaults.
	 * @throws Exception if conversion or writing fails, or an input directory
	 *             cannot be listed
	 */
	public static void main(String[] args)
		throws Exception
	{
		// Tolerate a null array so programmatic callers behave as before.
		int argCount = (args == null) ? 0 : args.length;
		String featuresBasePath = argCount > 0 ? args[0] : DEFAULT_FEATURES_BASE_PATH;
		String goldBasePath = argCount > 1 ? args[1] : DEFAULT_GOLD_BASE_PATH;

		// TRAIN

		File inputDir = new File(featuresBasePath + "/src/main/resources/semeval-train-all-combined-features");

		String arff = ArffConverter.toArffString(
				listFiles(inputDir, ".txt", true),
				new File(goldBasePath + "/src/main/resources/goldstandards/semeval/train/STS.gs.ALLcombined.txt"));

		FileUtils.writeStringToFile(new File("src/main/resources/models/semeval-train-all-combined.arff"), arff);

		// TEST

		inputDir = new File(featuresBasePath + "/src/main/resources/mm09-features");

		// No gold standard file is passed for this data set.
		arff = ArffConverter.toArffString(
				listFiles(inputDir, ".txt", true),
				null);

		FileUtils.writeStringToFile(new File("src/main/resources/models/mm09.arff"), arff);
	}

	/**
	 * Collects the files below a folder whose names end with the given suffix.
	 * Files and directories whose names start with "." are skipped.
	 *
	 * @param folder      the directory to scan
	 * @param suffix      the file name suffix a file must have to be included
	 * @param recursively whether to descend into (non-hidden) subdirectories
	 * @return the matching files, in the order the file system lists them
	 * @throws IllegalArgumentException if <code>folder</code> (or a visited
	 *             subdirectory) cannot be listed, e.g. because it does not
	 *             exist or is not a directory
	 */
	private static List<File> listFiles(File folder, String suffix, boolean recursively)
	{
		// File.listFiles() returns null instead of throwing when the path is
		// not a directory or an I/O error occurs; fail with a clear message
		// rather than a NullPointerException in the loop below.
		File[] entries = folder.listFiles();
		if (entries == null)
		{
			throw new IllegalArgumentException(
					"Cannot list files in: " + folder.getAbsolutePath());
		}

		List<File> files = new ArrayList<File>();

		for (File file : entries)
		{
			// Skip hidden entries (dot-files and dot-directories) entirely.
			if (file.getName().startsWith("."))
			{
				continue;
			}

			if (file.isDirectory())
			{
				if (recursively)
				{
					files.addAll(listFiles(file, suffix, recursively));
				}
			}
			else if (file.getName().endsWith(suffix))
			{
				files.add(file);
			}
		}

		return files;
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy