// net.jkernelmachines.kernel.extra.NystromKernel -- Maven / Gradle / Ivy
//
// Go to download
/*******************************************************************************
 * Copyright (c) 2016, David Picard.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without modification,
 * are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 * list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 * this list of conditions and the following disclaimer in the documentation and/or
 * other materials provided with the distribution.
 *
 * 3. Neither the name of the copyright holder nor the names of its contributors
 * may be used to endorse or promote products derived from this software without
 * specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
 * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *******************************************************************************/
package net.jkernelmachines.kernel.extra;

import static java.lang.Math.min;

import java.util.ArrayList;
import java.util.Collections;
import java.util.Comparator;
import java.util.List;

import net.jkernelmachines.kernel.Kernel;
import net.jkernelmachines.kernel.typed.DoubleLinear;
import net.jkernelmachines.type.TrainingSample;
import net.jkernelmachines.util.DebugPrinter;
import net.jkernelmachines.util.algebra.MatrixOperations;
import net.jkernelmachines.util.algebra.ThreadedMatrixOperations;

/**
 * This kernel provides a fast approximation of a given kernel using the Nystrom
 * approximation.
 * 
 * It also offers a fast active learning algorithm analogous to the one used in:
 * "Fast Approximation of Distance Between Elastic Curves using Kernels",
 * Hedi Tabia; David Picard; Hamid Laga; Philippe-Henri Gosselin,
 * British Machine Vision Conference (BMVC), Sep 2013, United Kingdom.
 * 
 * 
 * @author picard
 * 
 */
public class NystromKernel extends Kernel {

	/**
	 * 
	 */
	private static final long serialVersionUID = 6324067887253049771L;

	private static DebugPrinter debug = new DebugPrinter();

	Kernel kernel;
	DoubleLinear linear;
	private double[][] projectors;
	private double[] eigenvalues;
	private List> list;
	private int dim = -1;

	/**
	 * Default constructor with kernel to approximate as argument
	 * 
	 * @param kernel
	 *            the kernel to be approximated
	 */
	public NystromKernel(Kernel kernel) {
		this.kernel = kernel;
		linear = new DoubleLinear();
	}

	/**
	 * Train the Nystrom approx on a full training set.
	 * 
	 * 
	 * Might be costly for large training sets, since it involves the inversion
	 * of the Gram matrix.
	 * 
	 * 
	 * @param list
	 *            the training list of samples
	 */
	public void train(List> list) {
		this.list = new ArrayList>();
		this.list.addAll(list);
		dim = list.size();
		debug.println(3, "matrix size : " + dim);
		double[][] matrix = kernel.getKernelMatrix(list);
		double[][][] eig = MatrixOperations.eig(matrix);

		projectors = ThreadedMatrixOperations.transi(eig[0]);
		eigenvalues = new double[dim];
		for (int d = 0; d < dim; d++) {
			double p = eig[1][d][d];
			if (p > 1e-15) {
				eigenvalues[d] = 1. / Math.sqrt(p);
			}
		}

	}

	public void activeTrain(List> list, int iterations,
			int samples, int pool) {
		this.list = new ArrayList>();
		List> dup = new ArrayList>();
		List> poolList = new ArrayList>();
		dup.addAll(list);

		for (int i = 0; i < iterations; i++) {
			debug.println(3, "active iteration " + i);
			// select pool samples randomly
			Collections.shuffle(dup);

			poolList.clear();
			int dupSize = dup.size();
			for (int j = 0; j < min(pool, dupSize); j++) {
				poolList.add(dup.remove(0));
			}

			// computes errors
			class Err {
				public TrainingSample t;
				public double error;
			}
			List errors = new ArrayList();
			List> subPool = poolList.subList(0,
					min(pool, poolList.size()));
			double[][] mori = kernel.getKernelMatrix(subPool);
			double[][] mapp = getKernelMatrix(subPool);

			for (int j = 0; j < min(pool, poolList.size()); j++) {
				TrainingSample t = poolList.get(j);
				double e = 0;
				for (int k = 0; k < min(pool, poolList.size()); k++) {
					double v1 = mori[j][k];
					double v2 = mapp[j][k];
					double d = (v1 - v2);
					e += d * d;
				}
				Err err = new Err();
				err.t = t;
				err.error = e;
				errors.add(err);
			}
			Collections.sort(errors, new Comparator() {
				@Override
				public int compare(Err t1, Err t2) {
					return -Double.compare(t1.error, t2.error);
				}
			});

			// add high error to the list
			for (int k = 0; k < samples; k++) {
				this.list.add(errors.remove(0).t);
			}
			// add low error samples back to the pool
			while (!errors.isEmpty()) {
				dup.add(errors.remove(0).t);
			}

			// train
			this.train(this.list);
		}

	}

	/**
	 * Project a sample to the space induced by the Nystrom approx
	 * 
	 * @param sample sample
	 * @return projection of the sample
	 */
	public double[] projectSample(T sample) {
		// if was not train, return 0
		if (dim <= 0)
			return new double[1];

		double[] out = new double[dim];
		double[] km = new double[list.size()];
		for (int i = 0; i < list.size(); i++)
			km[i] = kernel.valueOf(list.get(i).sample, sample);

		for (int d = 0; d < dim; d++) {
			for (int i = 0; i < list.size(); i++) {
				out[d] += projectors[d][i] * km[i];
			}
			out[d] *= eigenvalues[d];
		}

		return out;
	}

	public List> projectList(List> l) {
		List> out = new ArrayList>(
				l.size());
		for (TrainingSample t : l) {
			double[] d = projectSample(t.sample);
			out.add(new TrainingSample(d, t.label));
		}
		return out;
	}

	/*
	 * (non-Javadoc)
	 * 
	 * @see fr.lip6.jkernelmachines.kernel.Kernel#valueOf(java.lang.Object,
	 * java.lang.Object)
	 */
	@Override
	public double valueOf(T t1, T t2) {
		return linear.valueOf(projectSample(t1), projectSample(t2));
	}

	/*
	 * (non-Javadoc)
	 * 
	 * @see fr.lip6.jkernelmachines.kernel.Kernel#valueOf(java.lang.Object)
	 */
	@Override
	public double valueOf(T t1) {
		double[] s = projectSample(t1);
		return linear.valueOf(s, s);
	}

}