/*===============================================================================
* Copyright (c) 2010-2016 University of Massachusetts. All Rights Reserved.
*
* Use of the RankLib package is subject to the terms of the software license set
* forth in the LICENSE file included with this software, and also available at
* http://people.cs.umass.edu/~vdang/ranklib_license.html
*===============================================================================
*/
package ciir.umass.edu.eval;
import ciir.umass.edu.features.*;
import ciir.umass.edu.learning.*;
import ciir.umass.edu.learning.boosting.AdaRank;
import ciir.umass.edu.learning.boosting.RankBoost;
import ciir.umass.edu.learning.neuralnet.ListNet;
import ciir.umass.edu.learning.neuralnet.Neuron;
import ciir.umass.edu.learning.neuralnet.RankNet;
import ciir.umass.edu.learning.tree.LambdaMART;
import ciir.umass.edu.learning.tree.RFRanker;
import ciir.umass.edu.metric.ERRScorer;
import ciir.umass.edu.metric.METRIC;
import ciir.umass.edu.metric.MetricScorer;
import ciir.umass.edu.metric.MetricScorerFactory;
import ciir.umass.edu.utilities.*;
import java.io.*;
import java.text.DecimalFormat;
import java.util.ArrayList;
import java.util.List;
/**
* @author vdang
*
* This class is meant to provide the interface to run and compare different ranking algorithms.
* It lets users specify general parameters (e.g. what algorithm to run, training/testing/validating
* data, etc.) as well as algorithm-specific parameters. Type "java -jar bin/RankLib.jar" at the
* command-line to see all the options.
*/
public class Evaluator {
/**
* @param args
*/
public static void main(String[] args) {
String[] rType = new String[] { "MART", "RankNet", "RankBoost", "AdaRank", "Coordinate Ascent",
"LambdaRank", "LambdaMART", "ListNet", "Random Forests",
"Linear Regression" };
RANKER_TYPE[] rType2 = new RANKER_TYPE[] { RANKER_TYPE.MART, RANKER_TYPE.RANKNET,
RANKER_TYPE.RANKBOOST, RANKER_TYPE.ADARANK,
RANKER_TYPE.COOR_ASCENT, RANKER_TYPE.LAMBDARANK,
RANKER_TYPE.LAMBDAMART, RANKER_TYPE.LISTNET,
RANKER_TYPE.RANDOM_FOREST, RANKER_TYPE.LINEAR_REGRESSION };
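//NOTE: rType[i] is the human-readable name of rType2[i]; the value given to -ranker is an index into these parallel arrays.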
String trainFile = "";
String featureDescriptionFile = "";
float ttSplit = 0;//train-test split
float tvSplit = 0;//train-validation split
int foldCV = -1;
String validationFile = "";
String testFile = "";
List<String> testFiles = new ArrayList<>();
int rankerType = 4;
String trainMetric = "ERR@10";
String testMetric = "";
Evaluator.normalize = false;
String savedModelFile = "";
List<String> savedModelFiles = new ArrayList<>();
String kcvModelDir = "";
String kcvModelFile = "";
String rankFile = "";
String prpFile = "";
int nThread = -1; // nThread = #cpu-cores
//for my personal use
String indriRankingFile = "";
String scoreFile = "";
if(args.length < 2)
{
System.out.println("Usage: java -jar RankLib.jar <Params>");
System.out.println("Params:");
System.out.println(" [+] Training (+ tuning and evaluation)");
System.out.println("\t-train <file>\t\tTraining data");
System.out.println("\t-ranker <type>\t\tSpecify which ranking algorithm to use");
System.out.println("\t\t\t\t0: MART (gradient boosted regression tree)");
System.out.println("\t\t\t\t1: RankNet");
System.out.println("\t\t\t\t2: RankBoost");
System.out.println("\t\t\t\t3: AdaRank");
System.out.println("\t\t\t\t4: Coordinate Ascent");
System.out.println("\t\t\t\t6: LambdaMART");
System.out.println("\t\t\t\t7: ListNet");
System.out.println("\t\t\t\t8: Random Forests");
System.out.println("\t\t\t\t9: Linear regression (L2 regularization)");
System.out.println("\t[ -feature <file> ]\tFeature description file: list features to be considered by the learner, each on a separate line");
System.out.println("\t\t\t\tIf not specified, all features will be used.");
//System.out.println("\t[ -metric2t ]\tMetric to optimize on the training data. Supported: MAP, NDCG@k, DCG@k, P@k, RR@k, BEST@k, ERR@k (default=" + trainMetric + ")");
System.out.println("\t[ -metric2t <metric> ]\tMetric to optimize on the training data. " +
"Supported: MAP, NDCG@k, DCG@k, P@k, RR@k, ERR@k (default=" + trainMetric + ")");
System.out.println("\t[ -gmax <label> ]\tHighest judged relevance label. It affects the calculation of ERR " +
"(default=" + (int)SimpleMath.logBase2(ERRScorer.MAX) + ", i.e. 5-point scale {0,1,2,3,4})");
System.out.println("\t[ -qrel <file> ]\tTREC-style relevance judgment file. It only affects MAP and NDCG (default=unspecified)");
System.out.println("\t[ -silent ]\t\tDo not print progress messages (which are printed by default)");
System.out.println("\t[ -missingZero ]\tSubstitute zero for missing feature values rather than throwing an exception.");
System.out.println("");
//System.out.println(" Use the entire specified training data");
System.out.println("\t[ -validate <file> ]\tSpecify if you want to tune your system on the validation data (default=unspecified)");
System.out.println("\t\t\t\tIf specified, the final model will be the one that performs best on the validation data");
System.out.println("\t[ -tvs <x \\in [0..1]> ]\tIf you don't have separate validation data, use this to set train-validation split to be (x)(1.0-x)");
System.out.println("\t[ -save <model> ]\tSave the model learned (default=not-save)");
System.out.println("");
System.out.println("\t[ -test <file> ]\tSpecify if you want to evaluate the trained model on this data (default=unspecified)");
System.out.println("\t[ -tts <x \\in [0..1]> ]\tSet train-test split to be (x)(1.0-x). -tts will override -tvs");
System.out.println("\t[ -metric2T <metric> ]\tMetric to evaluate on the test data (default to the same as specified for -metric2t)");
System.out.println("");
System.out.println("\t[ -norm <method> ]\tNormalize all feature vectors (default=no-normalization). Method can be:");
System.out.println("\t\t\t\tsum: normalize each feature by the sum of all its values");
System.out.println("\t\t\t\tzscore: normalize each feature by its mean/standard deviation");
System.out.println("\t\t\t\tlinear: normalize each feature by its min/max values");
//System.out.println("");
//System.out.println("\t[ -sparse ]\t\tUse sparse representation for all feature vectors (default=dense)");
System.out.println("");
System.out.println("\t[ -kcv <k> ]\t\tSpecify if you want to perform k-fold cross validation using the specified training data (default=NoCV)");
System.out.println("\t\t\t\t-tvs can be used to further reserve a portion of the training data in each fold for validation");
//System.out.println("\t\t\t\tData for each fold is created from sequential partitions of the training data.");
//System.out.println("\t\t\t\tRandomized partitioning can be done by shuffling the training data in advance.");
//System.out.println("\t\t\t\tType \"java -cp bin/RankLib.jar ciir.umass.edu.feature.FeatureManager\" for help with shuffling.");
System.out.println("\t[ -kcvmd <dir> ]\tDirectory for models trained via cross-validation (default=not-save)");
System.out.println("\t[ -kcvmn <model> ]\tName for the model learned in each fold. It will be prefixed with the fold number (default=empty)");
System.out.println("");
System.out.println(" [-] RankNet-specific parameters");
System.out.println("\t[ -epoch <T> ]\t\tThe number of epochs to train (default=" + RankNet.nIteration + ")");
System.out.println("\t[ -layer <layer> ]\tThe number of hidden layers (default=" + RankNet.nHiddenLayer + ")");
System.out.println("\t[ -node <node> ]\tThe number of hidden nodes per layer (default=" + RankNet.nHiddenNodePerLayer + ")");
System.out.println("\t[ -lr <rate> ]\t\tLearning rate (default=" + (new DecimalFormat("###.########")).format(RankNet.learningRate) + ")");
System.out.println("");
System.out.println(" [-] RankBoost-specific parameters");
System.out.println("\t[ -round <T> ]\t\tThe number of rounds to train (default=" + RankBoost.nIteration + ")");
System.out.println("\t[ -tc <k> ]\t\tNumber of threshold candidates to search. -1 to use all feature values (default=" +
RankBoost.nThreshold + ")");
System.out.println("");
System.out.println(" [-] AdaRank-specific parameters");
System.out.println("\t[ -round <T> ]\t\tThe number of rounds to train (default=" + AdaRank.nIteration + ")");
System.out.println("\t[ -noeq ]\t\tTrain without enqueuing too-strong features (default=unspecified)");
System.out.println("\t[ -tolerance <t> ]\tTolerance between two consecutive rounds of learning (default=" + AdaRank.tolerance + ")");
System.out.println("\t[ -max <times> ]\tThe maximum number of times a feature can be consecutively selected " +
"without changing performance (default=" + AdaRank.maxSelCount + ")");
System.out.println("");
System.out.println(" [-] Coordinate Ascent-specific parameters");
System.out.println("\t[ -r <k> ]\t\tThe number of random restarts (default=" + CoorAscent.nRestart + ")");
System.out.println("\t[ -i <iteration> ]\tThe number of iterations to search in each dimension (default=" + CoorAscent.nMaxIteration + ")");
System.out.println("\t[ -tolerance <t> ]\tPerformance tolerance between two solutions (default=" + CoorAscent.tolerance + ")");
System.out.println("\t[ -reg <slack> ]\tRegularization parameter (default=no-regularization)");
System.out.println("");
System.out.println(" [-] {MART, LambdaMART}-specific parameters");
System.out.println("\t[ -tree <t> ]\t\tNumber of trees (default=" + LambdaMART.nTrees + ")");
System.out.println("\t[ -leaf <l> ]\t\tNumber of leaves for each tree (default=" + LambdaMART.nTreeLeaves + ")");
System.out.println("\t[ -shrinkage <factor> ]\tShrinkage, or learning rate (default=" + LambdaMART.learningRate + ")");
System.out.println("\t[ -tc <k> ]\t\tNumber of threshold candidates for tree splitting. -1 to use all feature values (default=" +
LambdaMART.nThreshold + ")");
System.out.println("\t[ -mls <n> ]\t\tMin leaf support -- minimum % of docs each leaf has to contain (default=" +
LambdaMART.minLeafSupport + ")");
System.out.println("\t[ -estop <e> ]\t\tStop early when no improvement is observed on validation data in e consecutive rounds (default=" +
LambdaMART.nRoundToStopEarly + ")");
System.out.println("");
System.out.println(" [-] ListNet-specific parameters");
System.out.println("\t[ -epoch <T> ]\t\tThe number of epochs to train (default=" + ListNet.nIteration + ")");
System.out.println("\t[ -lr <rate> ]\t\tLearning rate (default=" + (new DecimalFormat("###.########")).format(ListNet.learningRate) + ")");
System.out.println("");
System.out.println(" [-] Random Forests-specific parameters");
System.out.println("\t[ -bag <r> ]\t\tNumber of bags (default=" + RFRanker.nBag + ")");
System.out.println("\t[ -srate <rate> ]\tSub-sampling rate (default=" + RFRanker.subSamplingRate + ")");
System.out.println("\t[ -frate <rate> ]\tFeature sampling rate (default=" + RFRanker.featureSamplingRate + ")");
int type = (RFRanker.rType.ordinal()-RANKER_TYPE.MART.ordinal());
System.out.println("\t[ -rtype <type> ]\tRanker to bag (default=" + type + ", i.e. " + rType[type] + ")");
System.out.println("\t[ -tree <t> ]\t\tNumber of trees in each bag (default=" + RFRanker.nTrees + ")");
System.out.println("\t[ -leaf <l> ]\t\tNumber of leaves for each tree (default=" + RFRanker.nTreeLeaves + ")");
System.out.println("\t[ -shrinkage <factor> ]\tShrinkage, or learning rate (default=" + RFRanker.learningRate + ")");
System.out.println("\t[ -tc <k> ]\t\tNumber of threshold candidates for tree splitting. -1 to use all feature values (default=" +
RFRanker.nThreshold + ")");
System.out.println("\t[ -mls <n> ]\t\tMin leaf support -- minimum % of docs each leaf has to contain (default=" + RFRanker.minLeafSupport + ")");
System.out.println("");
System.out.println(" [-] Linear Regression-specific parameters");
System.out.println("\t[ -L2 <reg> ]\t\tL2 regularization parameter (default=" + LinearRegRank.lambda + ")");
System.out.println("");
System.out.println(" [+] Testing previously saved models");
System.out.println("\t-load <model>\t\tThe model to load");
System.out.println("\t\t\t\tMultiple -load can be used to specify models from multiple folds (in increasing order),");
System.out.println("\t\t\t\t in which case the test/rank data will be partitioned accordingly.");
System.out.println("\t-test <file>\t\tTest data to evaluate the model(s) (specify either this or -rank but not both)");
System.out.println("\t-rank <file>\t\tRank the samples in the specified file (specify either this or -test but not both)");
System.out.println("\t[ -metric2T <metric> ]\tMetric to evaluate on the test data (default=" + trainMetric + ")");
System.out.println("\t[ -gmax <label> ]\tHighest judged relevance label. It affects the calculation of ERR (default=" + (int)SimpleMath.logBase2(ERRScorer.MAX) + ", i.e. 5-point scale {0,1,2,3,4})");
System.out.println("\t[ -score <file> ]\tStore ranker's score for each object being ranked (has to be used with -rank)");
System.out.println("\t[ -qrel <file> ]\tTREC-style relevance judgment file. It only affects MAP and NDCG (default=unspecified)");
System.out.println("\t[ -idv <file> ]\t\tSave model performance (in test metric) on individual ranked lists (has to be used with -test)");
System.out.println("\t[ -norm <method> ]\tNormalize feature vectors (similar to -norm for training/tuning)");
//System.out.println("\t[ -sparse ]\t\tUse sparse representation for all feature vectors (default=dense)");
System.out.println("");
return;
}
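//Illustrative invocations (file names are placeholders; flags are documented in the usage text above):
//  java -jar RankLib.jar -train train.txt -ranker 6 -metric2t NDCG@10 -save lm.model
//  java -jar RankLib.jar -load lm.model -test test.txt -metric2T ERR@10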
//parse command-line arguments; each flag below corresponds to an option documented in the usage text above
for(int i=0;i<args.length;i++)
{
if(args[i].compareTo("-train")==0)
trainFile = args[++i];
else if(args[i].compareTo("-ranker")==0)
rankerType = Integer.parseInt(args[++i]);
//... (one such branch per remaining option: -feature, -metric2t, -metric2T, -gmax, -qrel, -test, -validate, -tvs, -tts, -kcv, -kcvmd, -kcvmn, -norm, -save, -load, -rank, -score, -idv, and the algorithm-specific flags) ...
else
throw RankLibError.create("Unknown command-line parameter: " + args[i]);
}
if(nThread == -1)
nThread = Runtime.getRuntime().availableProcessors();
MyThreadPool.init(nThread);
if(testMetric.compareTo("")==0)
testMetric = trainMetric;
System.out.println("");
System.out.println("[+] General Parameters:");
Evaluator e = new Evaluator(rType2[rankerType], trainMetric, testMetric);
if(trainFile.compareTo("")!=0)//scenario: train a new model
{
System.out.println("Training data:\t" + trainFile);
//print out parameter settings
if(foldCV != -1)
{
System.out.println("Cross validation: " + foldCV + " folds.");
if(tvSplit > 0)
System.out.println("Train-Validation split: " + tvSplit);
}
else
{
if(testFile.compareTo("") != 0)
System.out.println("Test data:\t" + testFile);
else if(ttSplit > 0)//choose to split training data into train and test
System.out.println("Train-Test split: " + ttSplit);
if(validationFile.compareTo("")!=0)//the user has specified the validation set
System.out.println("Validation data:\t" + validationFile);
else if(ttSplit <= 0 && tvSplit > 0)
System.out.println("Train-Validation split: " + tvSplit);
}
System.out.println("Feature vector representation: " + ((useSparseRepresentation)?"Sparse":"Dense") + ".");
System.out.println("Ranking method:\t" + rType[rankerType]);
if(featureDescriptionFile.compareTo("")!=0)
System.out.println("Feature description file:\t" + featureDescriptionFile);
else
System.out.println("Feature description file:\tUnspecified. All features will be used.");
System.out.println("Train metric:\t" + trainMetric);
System.out.println("Test metric:\t" + testMetric);
if(trainMetric.toUpperCase().startsWith("ERR") || testMetric.toUpperCase().startsWith("ERR"))
System.out.println("Highest relevance label (to compute ERR): " + (int)SimpleMath.logBase2(ERRScorer.MAX));
if(qrelFile.compareTo("") != 0)
System.out.println("TREC-format relevance judgment (only affects MAP and NDCG scores): " + qrelFile);
System.out.println("Feature normalization: " + ((Evaluator.normalize)?Evaluator.nml.name():"No"));
if(kcvModelDir.compareTo("")!=0)
System.out.println("Models directory: " + kcvModelDir);
if(kcvModelFile.compareTo("")!=0)
System.out.println("Models' name: " + kcvModelFile);
if(modelFile.compareTo("")!=0)
System.out.println("Model file: " + modelFile);
//System.out.println("#threads:\t" + nThread);
System.out.println("");
System.out.println("[+] " + rType[rankerType] + "'s Parameters:");
RankerFactory rf = new RankerFactory();
rf.createRanker(rType2[rankerType]).printParameters();
System.out.println("");
//starting to do some work
if(foldCV != -1)
{
//if(kcvModelDir.compareTo("") != 0 && kcvModelFile.compareTo("") == 0)
// kcvModelFile = "default";
//
//- Behavioral changes: Write kcv models if kcvmd OR kcvmn defined. Use
// default names for missing arguments: "kcvmodels" default directory
// and "kcv" default model name.
if (kcvModelDir.compareTo("") != 0 && kcvModelFile.compareTo("") == 0) {
kcvModelFile = "kcv";
}
else if(kcvModelDir.compareTo("") == 0 && kcvModelFile.compareTo("") != 0) {
kcvModelDir = "kcvmodels";
}
//- models won't be saved if kcvModelDir="" [OBSOLETE]
//- Models saved if EITHER kcvmd OR kcvmn defined. Use default names for missing values.
e.evaluate(trainFile, featureDescriptionFile, foldCV, tvSplit, kcvModelDir, kcvModelFile);
}
else
{
if(ttSplit > 0.0)//we should use a held-out portion of the training data for testing?
e.evaluate(trainFile, validationFile, featureDescriptionFile, ttSplit);//no validation will be done if validationFile=""
else if(tvSplit > 0.0)//should we use a portion of the training data for validation?
e.evaluate(trainFile, tvSplit, testFile, featureDescriptionFile);
else
e.evaluate(trainFile, validationFile, testFile, featureDescriptionFile);//All files except for trainFile can be empty. This will be handled appropriately
}
}
else //scenario: test a saved model
{
System.out.println("Model file:\t" + savedModelFile);
System.out.println("Feature normalization: " + ((Evaluator.normalize)?Evaluator.nml.name():"No"));
if(rankFile.compareTo("") != 0)
{
if(scoreFile.compareTo("") != 0)
{
if(savedModelFiles.size() > 1)//models trained via cross-validation
e.score(savedModelFiles, rankFile, scoreFile);
else //a single model
e.score(savedModelFile, rankFile, scoreFile);
}
else if(indriRankingFile.compareTo("") != 0)
{
if(savedModelFiles.size() > 1)//models trained via cross-validation
e.rank(savedModelFiles, rankFile, indriRankingFile);
else if(savedModelFiles.size() == 1)
e.rank(savedModelFile, rankFile, indriRankingFile);
else {
//This is *ONLY* for debugging purposes. It is *NOT* exposed via cmd-line
//It will evaluate the input ranking (without being re-ranked by any model) using any measure specified via metric2T
e.rank(rankFile, indriRankingFile);
}
}
else
{
throw RankLibError.create("This function has been removed.\n" +
"Consider using -score in addition to your current parameters, " +
"and do the ranking yourself based on these scores.");
//e.rank(savedModelFile, rankFile);
}
}
else
{
System.out.println("Test metric:\t" + testMetric);
if(testMetric.startsWith("ERR"))
System.out.println("Highest relevance label (to compute ERR): " + (int)SimpleMath.logBase2(ERRScorer.MAX));
if(savedModelFile.compareTo("") != 0)
{
if(savedModelFiles.size() > 1)//models trained via cross-validation
{
if(testFiles.size() > 1)
e.test(savedModelFiles, testFiles, prpFile);
else
e.test(savedModelFiles, testFile, prpFile);
}
else if(savedModelFiles.size() == 1) // a single model
e.test(savedModelFile, testFile, prpFile);
}
else if(scoreFile.compareTo("") != 0)
e.testWithScoreFile(testFile, scoreFile);
//It will evaluate the input ranking (without being re-ranked by any model) using any measure specified via metric2T
else
e.test(testFile, prpFile);
}
}
MyThreadPool.getInstance().shutdown();
}
//main settings
public static boolean mustHaveRelDoc = false;
public static boolean useSparseRepresentation = false;
public static boolean normalize = false;
public static Normalizer nml = new SumNormalizor();
public static String modelFile = "";
public static String qrelFile = "";//measures such as NDCG and MAP require "complete" judgments.
//The relevance labels attached to our samples might be only a subset of the entire relevance judgment set.
//If we're working on datasets like LETOR/Web10K or Yahoo! LTR, we can safely ignore this parameter.
//However, if we sample the top-K documents from a baseline run (e.g. query-likelihood) to create training data for TREC collections,
//there's a high chance some relevant document (in the qrel file TREC provides) does not appear in our top-K list -- thus the calculation of
//MAP and NDCG is no longer precise. If so, specify that "external" relevance judgment here (via the -qrel cmd parameter).
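//A TREC qrel line has the form "<qid> <iter> <docid> <relevance>", e.g. "51 0 someDocID 1" (the docid here is illustrative).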
//tmp settings, for personal use
public static String newFeatureFile = "";
public static boolean keepOrigFeatures = false;
public static int topNew = 2000;
protected RankerFactory rFact = new RankerFactory();
protected MetricScorerFactory mFact = new MetricScorerFactory();
protected MetricScorer trainScorer = null;
protected MetricScorer testScorer = null;
protected RANKER_TYPE type = RANKER_TYPE.MART;
public Evaluator(RANKER_TYPE rType, METRIC trainMetric, METRIC testMetric)
{
this.type = rType;
trainScorer = mFact.createScorer(trainMetric);
testScorer = mFact.createScorer(testMetric);
if(qrelFile.compareTo("") != 0)
{
trainScorer.loadExternalRelevanceJudgment(qrelFile);
testScorer.loadExternalRelevanceJudgment(qrelFile);
}
}
public Evaluator(RANKER_TYPE rType, METRIC trainMetric, int trainK, METRIC testMetric, int testK)
{
this.type = rType;
trainScorer = mFact.createScorer(trainMetric, trainK);
testScorer = mFact.createScorer(testMetric, testK);
if(qrelFile.compareTo("") != 0)
{
trainScorer.loadExternalRelevanceJudgment(qrelFile);
testScorer.loadExternalRelevanceJudgment(qrelFile);
}
}
public Evaluator(RANKER_TYPE rType, METRIC trainMetric, METRIC testMetric, int k)
{
this.type = rType;
trainScorer = mFact.createScorer(trainMetric, k);
testScorer = mFact.createScorer(testMetric, k);
if(qrelFile.compareTo("") != 0)
{
trainScorer.loadExternalRelevanceJudgment(qrelFile);
testScorer.loadExternalRelevanceJudgment(qrelFile);
}
}
public Evaluator(RANKER_TYPE rType, METRIC metric, int k)
{
this.type = rType;
trainScorer = mFact.createScorer(metric, k);
if(qrelFile.compareTo("") != 0)
trainScorer.loadExternalRelevanceJudgment(qrelFile);
testScorer = trainScorer;
}
public Evaluator(RANKER_TYPE rType, String trainMetric, String testMetric)
{
this.type = rType;
trainScorer = mFact.createScorer(trainMetric);
testScorer = mFact.createScorer(testMetric);
if(qrelFile.compareTo("") != 0)
{
trainScorer.loadExternalRelevanceJudgment(qrelFile);
testScorer.loadExternalRelevanceJudgment(qrelFile);
}
}
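//Programmatic usage sketch (file names are placeholders; metric strings follow the -metric2t/-metric2T syntax):
//  Evaluator ev = new Evaluator(RANKER_TYPE.LAMBDAMART, "NDCG@10", "ERR@10");
//  ev.evaluate("train.txt", "vali.txt", "test.txt", "");//empty feature file = use all features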
public List<RankList> readInput(String inputFile)
{
return FeatureManager.readInput(inputFile, mustHaveRelDoc, useSparseRepresentation);
}
public void normalize(List<RankList> samples)
{
for (RankList sample : samples) nml.normalize(sample);
}
public void normalize(List<RankList> samples, int[] fids)
{
for (RankList sample : samples) nml.normalize(sample, fids);
}
public void normalizeAll(List<List<RankList>> samples, int[] fids)
{
for (List<RankList> sample : samples) normalize(sample, fids);
}
public int[] readFeature(String featureDefFile)
{
//if(featureDefFile.compareTo("") == 0)
if (featureDefFile.isEmpty())
return null;
return FeatureManager.readFeature(featureDefFile);
}
public double evaluate(Ranker ranker, List<RankList> rl)
{
List<RankList> l = rl;
if(ranker != null)
l = ranker.rank(rl);
return testScorer.score(l);
}
/**
* Evaluate the currently selected ranking algorithm using the given training, validation, and test data with the defined features.
* @param trainFile
* @param validationFile
* @param testFile
* @param featureDefFile
*/
public void evaluate(String trainFile, String validationFile, String testFile, String featureDefFile)
{
List<RankList> train = readInput(trainFile);//read input
List<RankList> validation = null;
//if(validationFile.compareTo("")!=0)
if (!validationFile.isEmpty())
validation = readInput(validationFile);
List<RankList> test = null;
//if(testFile.compareTo("")!=0)
if (!testFile.isEmpty())
test = readInput(testFile);
int[] features = readFeature(featureDefFile);//read features
if(features == null)//no features specified ==> use all features in the training file
features = FeatureManager.getFeatureFromSampleVector(train);
if(normalize)
{
normalize(train, features);
if(validation != null)
normalize(validation, features);
if(test != null)
normalize(test, features);
}
RankerTrainer trainer = new RankerTrainer();
Ranker ranker = trainer.train(type, train, validation, features, trainScorer);
if(test != null)
{
double rankScore = evaluate(ranker, test);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
}
if(modelFile.compareTo("")!=0)
{
System.out.println("");
ranker.save(modelFile);
System.out.println("Model saved to: " + modelFile);
}
}
/**
* Evaluate the currently selected ranking algorithm using percentTrain% of the samples for training and the rest for testing.
* @param sampleFile
* @param validationFile Empty string for "no validation data"
* @param featureDefFile
* @param percentTrain
*/
public void evaluate(String sampleFile, String validationFile, String featureDefFile, double percentTrain)
{
List<RankList> trainingData = new ArrayList<>();
List<RankList> testData = new ArrayList<>();
int[] features = prepareSplit(sampleFile, featureDefFile, percentTrain, normalize, trainingData, testData);
List<RankList> validation = null;
//if(validationFile.compareTo("") != 0)
if (!validationFile.isEmpty())
{
validation = readInput(validationFile);
if(normalize)
normalize(validation, features);
}
RankerTrainer trainer = new RankerTrainer();
Ranker ranker = trainer.train(type, trainingData, validation, features, trainScorer);
double rankScore = evaluate(ranker, testData);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
if(modelFile.compareTo("")!=0)
{
System.out.println("");
ranker.save(modelFile);
System.out.println("Model saved to: " + modelFile);
}
}
/**
* Evaluate the currently selected ranking algorithm using percentTrain% of the training samples for training and the rest as validation data.
* Test data is specified separately.
* @param trainFile
* @param percentTrain
* @param testFile Empty string for "no test data"
* @param featureDefFile
*/
public void evaluate(String trainFile, double percentTrain, String testFile, String featureDefFile)
{
List<RankList> train = new ArrayList<>();
List<RankList> validation = new ArrayList<>();
int[] features = prepareSplit(trainFile, featureDefFile, percentTrain, normalize, train, validation);
List<RankList> test = null;
//if(testFile.compareTo("") != 0)
if (!testFile.isEmpty())
{
test = readInput(testFile);
if(normalize)
normalize(test, features);
}
RankerTrainer trainer = new RankerTrainer();
Ranker ranker = trainer.train(type, train, validation, features, trainScorer);
if(test != null)
{
double rankScore = evaluate(ranker, test);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
}
if(modelFile.compareTo("")!=0)
{
System.out.println("");
ranker.save(modelFile);
System.out.println("Model saved to: " + modelFile);
}
}
/**
* Evaluate the currently selected ranking algorithm using k-fold cross validation.
* @param sampleFile
* @param featureDefFile
* @param nFold
* @param modelDir
* @param modelFile
*/
public void evaluate(String sampleFile, String featureDefFile, int nFold, String modelDir, String modelFile)
{
evaluate(sampleFile, featureDefFile, nFold, -1, modelDir, modelFile);
}
/**
* Evaluate the currently selected ranking algorithm using k-fold cross validation.
* @param sampleFile
* @param featureDefFile
* @param nFold
* @param tvs Train-validation split ratio.
* @param modelDir
* @param modelFile
*/
public void evaluate(String sampleFile, String featureDefFile, int nFold, float tvs, String modelDir, String modelFile)
{
List<List<RankList>> trainingData = new ArrayList<>();
List<List<RankList>> validationData = new ArrayList<>();
List<List<RankList>> testData = new ArrayList<>();
//read all samples
//List samples = FeatureManager.readInput(sampleFile);
List<RankList> samples = readInput(sampleFile);
//get features
int[] features = readFeature(featureDefFile);//read features
if(features == null)//no features specified ==> use all features in the training file
features = FeatureManager.getFeatureFromSampleVector(samples);
FeatureManager.prepareCV(samples, nFold, tvs, trainingData, validationData, testData);
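//Folds are built from sequential partitions of the training data; shuffle the data beforehand (e.g. with FeatureManager) if randomized folds are needed.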
//normalization
if(normalize)
{
normalizeAll(trainingData, features);
normalizeAll(validationData, features);
normalizeAll(testData, features);
}
Ranker ranker = null;
double scoreOnTrain = 0.0;//sum of the train metric across folds
double scoreOnTest = 0.0;//sum of the test metric across folds
double totalScoreOnTest = 0.0;
int totalTestSampleSize = 0;
double[][] scores = new double[nFold][];
for(int i=0;i<nFold;i++)
scores[i] = new double[]{0.0, 0.0};
//train and evaluate on each fold
for(int i=0;i<nFold;i++)
{
List<RankList> train = trainingData.get(i);
List<RankList> vali = null;
if(tvs > 0)
vali = validationData.get(i);
List<RankList> test = testData.get(i);
RankerTrainer trainer = new RankerTrainer();
ranker = trainer.train(type, train, vali, features, trainScorer);
double s2 = evaluate(ranker, test);
scoreOnTrain += ranker.getScoreOnTrainingData();
scoreOnTest += s2;
totalScoreOnTest += s2 * test.size();
totalTestSampleSize += test.size();
//save performance in each fold
scores[i][0] = ranker.getScoreOnTrainingData();
scores[i][1] = s2;
//if(modelDir.compareTo("") != 0)
if (!modelDir.isEmpty())
{
ranker.save(FileUtils.makePathStandard(modelDir) + "f" + (i+1) + "." + modelFile);
System.out.println("Fold-" + (i+1) + " model saved to: " + modelFile);
}
}
System.out.println("Summary:");
System.out.println(testScorer.name() + "\t| Train\t| Test");
System.out.println("----------------------------------");
for(int i=0;i<nFold;i++)
System.out.println("Fold " + (i+1) + "\t| " + SimpleMath.round(scores[i][0], 4) + "\t| " + SimpleMath.round(scores[i][1], 4));
System.out.println("----------------------------------");
System.out.println("Avg.\t| " + SimpleMath.round(scoreOnTrain/nFold, 4) + "\t| " + SimpleMath.round(scoreOnTest/nFold, 4));
System.out.println("Total\t| \t| " + SimpleMath.round(totalScoreOnTest/totalTestSampleSize, 4));
}
/**
* Evaluate the performance (in -metric2T) of the input rankings, as they are, without any re-ranking.
* @param testFile Input rankings
*/
public void test(String testFile)
{
List<RankList> test = readInput(testFile);
double rankScore = evaluate(null, test);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
}
public void test(String testFile, String prpFile)
{
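//Score each ranked list as-is (no re-ranking) and report the macro-average over all lists.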
List<RankList> test = readInput(testFile);
double rankScore = 0.0;
List<String> ids = new ArrayList<>();
List<Double> scores = new ArrayList<>();
for (RankList l : test) {
double score = testScorer.score(l);
ids.add(l.getID());
scores.add(score);
rankScore += score;
}
rankScore /= test.size();
ids.add("all");
scores.add(rankScore);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
//if(prpFile.compareTo("") != 0)
if (!prpFile.isEmpty())
{
savePerRankListPerformanceFile(ids, scores, prpFile);
System.out.println("Per-ranked list performance saved to: " + prpFile);
}
}
/**
* Evaluate the performance (in -metric2T) of a pre-trained model. Save its performance on each of the ranked lists if prpFile is specified.
* @param modelFile Pre-trained model
* @param testFile Test data
* @param prpFile Per-ranked list performance file: the model's performance on each of the ranked lists. These won't be saved if prpFile="".
*/
public void test(String modelFile, String testFile, String prpFile)
{
Ranker ranker = rFact.loadRankerFromFile(modelFile);
int[] features = ranker.getFeatures();
List<RankList> test = readInput(testFile);
if(normalize)
normalize(test, features);
double rankScore = 0.0;
List<String> ids = new ArrayList<>();
List<Double> scores = new ArrayList<>();
for (RankList aTest : test) {
RankList l = ranker.rank(aTest);
double score = testScorer.score(l);
ids.add(l.getID());
scores.add(score);
rankScore += score;
}
rankScore /= test.size();
ids.add("all");
scores.add(rankScore);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
//if(prpFile.compareTo("") != 0)
if (!prpFile.isEmpty())
{
savePerRankListPerformanceFile(ids, scores, prpFile);
System.out.println("Per-ranked list performance saved to: " + prpFile);
}
}
/**
* Evaluate the performance (in -metric2T) of k pre-trained models. Data in the test file will be split into k folds, where k=|models|.
* Each model will be evaluated on the data from the corresponding fold.
* @param modelFiles Pre-trained models
* @param testFile Test data
* @param prpFile Per-ranked list performance file: the model's performance on each of the ranked lists. These won't be saved if prpFile="".
*/
public void test(List<String> modelFiles, String testFile, String prpFile)
{
List<List<RankList>> trainingData = new ArrayList<>();
List<List<RankList>> testData = new ArrayList<>();
//read all samples
int nFold = modelFiles.size();
//List samples = FeatureManager.readInput(testFile);
List<RankList> samples = readInput(testFile);
System.out.print("Preparing " + nFold + "-fold test data... ");
FeatureManager.prepareCV(samples, nFold, trainingData, testData);
System.out.println("[Done.]");
double rankScore = 0.0;
List<String> ids = new ArrayList<>();
List<Double> scores = new ArrayList<>();
for(int f=0;f<nFold;f++)
{
List<RankList> test = testData.get(f);
Ranker ranker = rFact.loadRankerFromFile(modelFiles.get(f));
int[] features = ranker.getFeatures();
if(normalize)
normalize(test, features);
for (RankList aTest : test) {
RankList l = ranker.rank(aTest);
double score = testScorer.score(l);
ids.add(l.getID());
scores.add(score);
rankScore += score;
}
}
rankScore = rankScore/ids.size();
ids.add("all");
scores.add(rankScore);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
//if(prpFile.compareTo("") != 0)
if (!prpFile.isEmpty())
{
savePerRankListPerformanceFile(ids, scores, prpFile);
System.out.println("Per-ranked list performance saved to: " + prpFile);
}
}
/**
* Similar to the above, except the data has already been split. The k-th model will be applied to the k-th test file.
* @param modelFiles
* @param testFiles
* @param prpFile
*/
public void test(List<String> modelFiles, List<String> testFiles, String prpFile)
{
int nFold = modelFiles.size();
double rankScore = 0.0;
List<String> ids = new ArrayList<>();
List<Double> scores = new ArrayList<>();
for(int f=0;f<nFold;f++)
{
List<RankList> test = readInput(testFiles.get(f));
Ranker ranker = rFact.loadRankerFromFile(modelFiles.get(f));
int[] features = ranker.getFeatures();
if(normalize)
normalize(test, features);
for (RankList aTest : test) {
RankList l = ranker.rank(aTest);
double score = testScorer.score(l);
ids.add(l.getID());
scores.add(score);
rankScore += score;
}
}
rankScore = rankScore/ids.size();
ids.add("all");
scores.add(rankScore);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
//if(prpFile.compareTo("") != 0)
if (!prpFile.isEmpty())
{
savePerRankListPerformanceFile(ids, scores, prpFile);
System.out.println("Per-ranked list performance saved to: " + prpFile);
}
}
/**
* Re-order the input rankings and measure their effectiveness (in -metric2T)
* @param testFile Input rankings
* @param scoreFile The model score file on each of the documents
*/
public void testWithScoreFile(String testFile, String scoreFile)
{
try (BufferedReader in = FileUtils.smartReader(scoreFile)) {
List<RankList> test = readInput(testFile);
String content = "";
List<Double> scores = new ArrayList<>();
while((content = in.readLine()) != null)
{
content = content.trim();
if(content.compareTo("") == 0)
continue;
scores.add(Double.parseDouble(content));
}
in.close();
int k = 0;
//re-rank each list according to the scores read from the score file
for(int i=0;i<test.size();i++)
{
RankList rl = test.get(i);
double[] s = new double[rl.size()];
for(int j=0;j<rl.size();j++)
s[j] = scores.get(k++);
rl = new RankList(rl, MergeSorter.sort(s, false));
test.set(i, rl);
}
double rankScore = evaluate(null, test);
System.out.println(testScorer.name() + " on test data: " + SimpleMath.round(rankScore, 4));
}
catch(IOException ex)
{
throw RankLibError.create("Error in Evaluator::testWithScoreFile(): ", ex);
}
}
/**
* Write the model's score for each of the documents in a test ranking.
* @param modelFile Pre-trained model
* @param testFile Test data
* @param outputFile Output score file
*/
public void score(String modelFile, String testFile, String outputFile)
{
Ranker ranker = rFact.loadRankerFromFile(modelFile);
int[] features = ranker.getFeatures();
List<RankList> test = readInput(testFile);
if(normalize)
normalize(test, features);
try {
BufferedWriter out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(outputFile), "UTF-8"));
for (RankList l : test) {
for (int j = 0; j < l.size(); j++) {
out.write(l.getID() + "\t" + j + "\t" + ranker.eval(l.get(j)) + "");
out.newLine();
}
}
out.close();
}
catch(IOException ex)
{
throw RankLibError.create("Error in Evaluator::score(): ", ex);
}
}
/**
* Write the models' score for each of the documents in a test ranking. The test rankings are split into k chunks, where k=|models|.
* Each model is applied on the data from the corresponding fold.
* @param modelFiles
* @param testFile
* @param outputFile
*/
public void score(List<String> modelFiles, String testFile, String outputFile)
{
List<List<RankList>> trainingData = new ArrayList<>();
List<List<RankList>> testData = new ArrayList<>();
//read all samples
int nFold = modelFiles.size();
//List samples = FeatureManager.readInput(testFile);
List<RankList> samples = readInput(testFile);
System.out.print("Preparing " + nFold + "-fold test data... ");
FeatureManager.prepareCV(samples, nFold, trainingData, testData);
System.out.println("[Done.]");
try {
BufferedWriter out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(outputFile), "UTF-8"));
for(int f=0;f<nFold;f++)
{
List<RankList> test = testData.get(f);
Ranker ranker = rFact.loadRankerFromFile(modelFiles.get(f));
int[] features = ranker.getFeatures();
if(normalize)
normalize(test, features);
for (RankList l : test) {
for (int j = 0; j < l.size(); j++) {
out.write(l.getID() + "\t" + j + "\t" + ranker.eval(l.get(j)) + "");
out.newLine();
}
}
}
out.close();
}
catch(IOException ex)
{
throw RankLibError.create("Error in Evaluator::score(): ", ex);
}
}
/**
* Similar to the above, except data has already been split. The k-th model will be applied on the k-th test file.
* @param modelFiles
* @param testFiles
* @param outputFile
*/
public void score(List<String> modelFiles, List<String> testFiles, String outputFile)
{
int nFold = modelFiles.size();
try (BufferedWriter out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(outputFile), "UTF-8"))) {
for(int f=0;f<nFold;f++)
{
List<RankList> test = readInput(testFiles.get(f));
Ranker ranker = rFact.loadRankerFromFile(modelFiles.get(f));
int[] features = ranker.getFeatures();
if(normalize)
normalize(test, features);
for (RankList l : test) {
for (int j = 0; j < l.size(); j++) {
out.write(l.getID() + "\t" + j + "\t" + ranker.eval(l.get(j)) + "");
out.newLine();
}
}
}
}
catch(IOException ex)
{
throw RankLibError.create("Error in Evaluator::score(): ", ex);
}
}
/**
* Use a pre-trained model to re-rank the test rankings. Save the output ranking in Indri's run format.
* @param modelFile
* @param testFile
* @param indriRanking
*/
public void rank(String modelFile, String testFile, String indriRanking)
{
Ranker ranker = rFact.loadRankerFromFile(modelFile);
int[] features = ranker.getFeatures();
List<RankList> test = readInput(testFile);
if(normalize)
normalize(test, features);
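//Each output line follows the TREC run format: "<qid> Q0 <docid> <rank> <score> indri".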
try {
BufferedWriter out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(indriRanking), "UTF-8"));
for (RankList l : test) {
double[] scores = new double[l.size()];
for (int j = 0; j < l.size(); j++)
scores[j] = ranker.eval(l.get(j));
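//sort document indices in descending order of model score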
int[] idx = MergeSorter.sort(scores, false);
for (int j = 0; j < idx.length; j++) {
int k = idx[j];
String str = l.getID() + " Q0 " + l.get(k).getDescription().replace("#", "").trim() +
" " + (j + 1) + " " + SimpleMath.round(scores[k], 5) + " indri";
out.write(str);
out.newLine();
}
}
out.close();
}
catch(IOException ex)
{
throw RankLibError.create("Error in Evaluator::rank(): ", ex);
}
}
/**
* Generate a ranking in Indri's format from the input ranking
* @param testFile
* @param indriRanking
*/
public void rank(String testFile, String indriRanking)
{
List<RankList> test = readInput(testFile);
try {
BufferedWriter out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(indriRanking), "UTF-8"));
for (RankList l : test) {
for (int j = 0; j < l.size(); j++) {
String str = l.getID() + " Q0 " + l.get(j).getDescription().replace("#", "").trim() + " " +
(j + 1) + " " + SimpleMath.round(1.0 - 0.0001 * j, 5) + " indri";
out.write(str);
out.newLine();
}
}
out.close();
}
catch(IOException ex)
{
throw RankLibError.create("Error in Evaluator::rank(): ", ex);
}
}
/**
* Use k pre-trained models to re-rank the test rankings. The test rankings will be split into k folds, where k=|models|.
* Each model will be used to rank the data from the corresponding fold. Save the output ranking in indri's run format.
* @param modelFiles
* @param testFile
* @param indriRanking
*/
public void rank(List<String> modelFiles, String testFile, String indriRanking)
{
List<List<RankList>> trainingData = new ArrayList<>();
List<List<RankList>> testData = new ArrayList<>();
//read all samples
int nFold = modelFiles.size();
//List samples = FeatureManager.readInput(testFile);
List<RankList> samples = readInput(testFile);
System.out.print("Preparing " + nFold + "-fold test data... ");
FeatureManager.prepareCV(samples, nFold, trainingData, testData);
System.out.println("[Done.]");
try {
BufferedWriter out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(indriRanking), "UTF-8"));
for(int f=0;f<nFold;f++)
{
List<RankList> test = testData.get(f);
Ranker ranker = rFact.loadRankerFromFile(modelFiles.get(f));
int[] features = ranker.getFeatures();
if(normalize)
normalize(test, features);
for (RankList l : test) {
double[] scores = new double[l.size()];
for (int j = 0; j < l.size(); j++)
scores[j] = ranker.eval(l.get(j));
int[] idx = MergeSorter.sort(scores, false);
for (int j = 0; j < idx.length; j++) {
int k = idx[j];
String str = l.getID() + " Q0 " + l.get(k).getDescription().replace("#", "").trim() + " " +
(j + 1) + " " + SimpleMath.round(scores[k], 5) + " indri";
out.write(str);
out.newLine();
}
}
}
out.close();
}
catch(Exception ex)
{
throw RankLibError.create("Error in Evaluator::rank(): ", ex);
}
}
/**
* Similar to the above, except the data has already been split. The k-th model will be applied to the k-th test file.
* @param modelFiles
* @param testFiles
* @param indriRanking
*/
public void rank(List<String> modelFiles, List<String> testFiles, String indriRanking)
{
int nFold = modelFiles.size();
try {
BufferedWriter out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(indriRanking), "UTF-8"));
for(int f=0;f<nFold;f++)
{
List<RankList> test = readInput(testFiles.get(f));
Ranker ranker = rFact.loadRankerFromFile(modelFiles.get(f));
int[] features = ranker.getFeatures();
if(normalize)
normalize(test, features);
for (RankList l : test) {
double[] scores = new double[l.size()];
for (int j = 0; j < l.size(); j++)
scores[j] = ranker.eval(l.get(j));
int[] idx = MergeSorter.sort(scores, false);
for (int j = 0; j < idx.length; j++) {
int k = idx[j];
String str = l.getID() + " Q0 " + l.get(k).getDescription().replace("#", "").trim() + " " + (j + 1) + " " + SimpleMath.round(scores[k], 5) + " indri";
out.write(str);
out.newLine();
}
}
}
out.close();
}
catch(IOException ex)
{
throw RankLibError.create("Error in Evaluator::rank(): ", ex);
}
}
/**
* Split the input file into two with respect to a specified split size.
* @param sampleFile Input data file
* @param featureDefFile Feature definition file (if it's an empty string, all features in the input file will be used)
* @param percentTrain How much of the input data will be used for training? (the remaining will be reserved for test/validation)
* @param normalize Whether to do normalization.
* @param trainingData [Output] Training data (after splitting)
* @param testData [Output] Test (or validation) data (after splitting)
* @return A list of ids of the features to be used for learning.
*/
private int[] prepareSplit(String sampleFile, String featureDefFile, double percentTrain, boolean normalize, List<RankList> trainingData, List<RankList> testData)
{
//read input
List data = readInput(sampleFile);
//read features
int[] features = readFeature(featureDefFile);
// no features specified ==> use all features in the training file
if(features == null)
features = FeatureManager.getFeatureFromSampleVector(data);
if(normalize)
normalize(data, features);
FeatureManager.prepareSplit(data, percentTrain, trainingData, testData);
return features;
}
/**
* Save systems' performance to file
* @param ids Ranked list IDs.
* @param scores Evaluation score (in whatever measure specified/calculated upstream such as NDCG@k, ERR@k, etc.)
* @param prpFile Output filename.
*/
public void savePerRankListPerformanceFile(List<String> ids, List<Double> scores, String prpFile)
{
try (BufferedWriter out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(prpFile)))) {
for(int i=0;i<ids.size();i++)
{
out.write(testScorer.name() + "   " + ids.get(i) + "   " + scores.get(i));
out.newLine();
}
}
catch(IOException ex)
{
throw RankLibError.create("Error in Evaluator::savePerRankListPerformanceFile(): ", ex);
}
}
}