
org.ddogleg.optimization.impl.LevenbergMarquardtDampened


DDogleg Numerics is a high-performance Java library for non-linear optimization, robust model fitting, polynomial root finding, sorting, and more.

/*
 * Copyright (c) 2012-2013, Peter Abeles. All Rights Reserved.
 *
 * This file is part of DDogleg (http://ddogleg.org).
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.ddogleg.optimization.impl;

import org.ejml.alg.dense.linsol.LinearSolverSafe;
import org.ejml.alg.dense.mult.VectorVectorMult;
import org.ejml.data.DenseMatrix64F;
import org.ejml.factory.LinearSolver;
import org.ejml.ops.CommonOps;

/**
 * <p>
 * Modification of {@link LevenbergDampened} which incorporates the insight of Marquardt. The insight
 * was to use the function's curvature information to increase dampening along directions with
 * a larger gradient. In practice this method seems to do better on nearly singular systems.
 * </p>
 *
 * <p>
 * The step 'x' is computed using the following formula:
 * [J(k)'*J(k) + μ*diag(J(k)'*J(k))]x = -g = -J'*f
 * where J is the Jacobian, μ is the damping coefficient, g is the gradient, and
 * f is the function's output.
 * </p>
 *
 * <p>
 * The linear solver it uses is specified in the constructor. A Cholesky-based solver will be the fastest,
 * but it can fail if the J(x)'J(x) matrix is nearly singular. In those situations a pseudo-inverse type
 * solver should be used, which is immune to that type of problem but much more expensive.
 * </p>
 *
 * @author Peter Abeles
 */
public class LevenbergMarquardtDampened extends LevenbergDenseBase {

    // solver used to compute (A + mu*diag(A))d = g
    protected LinearSolver<DenseMatrix64F> solver;

    /**
     * Specifies the termination condition and linear solver. Selection of the linear solver can affect
     * speed and robustness.
     *
     * @param solver Linear solver. Cholesky or pseudo-inverse are recommended.
     * @param initialDampParam Initial value of the dampening parameter. Tune it; try 1e-3.
     */
    public LevenbergMarquardtDampened(LinearSolver<DenseMatrix64F> solver,
                                      double initialDampParam) {
        super(initialDampParam);
        this.solver = solver;
        // wrap solvers that modify their 'B' input so the caller's data is preserved
        if( solver.modifiesB() )
            this.solver = new LinearSolverSafe<DenseMatrix64F>(solver);
    }

    @Override
    protected void computeJacobian( DenseMatrix64F residuals , DenseMatrix64F gradient ) {
        // calculate the Jacobian values at the current sample point
        function.computeJacobian(jacobianVals.data);

        // compute helper matrices
        // B = J'*J;   g = J'*r
        // Take advantage of symmetry when computing B and only compute the upper triangular
        // portion used by Cholesky decomposition
        CommonOps.multInner(jacobianVals, B);
        CommonOps.multTransA(jacobianVals, residuals, gradient);

        // extract diagonal elements from B
        CommonOps.extractDiag(B, Bdiag);
    }

    @Override
    protected boolean computeStep( double lambda, DenseMatrix64F gradientNegative, DenseMatrix64F step ) {
        // add the dampening parameter along the diagonal: B_ii = (1 + lambda)*diag(J'*J)_ii
        for( int i = 0; i < N; i++ ) {
            int index = B.getIndex(i,i);
            B.data[index] = (1+lambda)*Bdiag.data[i];
        }

        // decompose the damped system
        if( !solver.setA(B) ) {
            // addToMessage("Singularity encountered. Try a more robust solver like pseudo inverse");
            return false;
        }

        // solve for the change in x
        solver.solve(gradientNegative, step);

        return true;
    }

    /**
     * Computes the change predicted by the model:
     *
     * m_k(0) - m_k(p_k) = -g_k'*p - 0.5*p'*B*p
     * (J'*J + mu*diag(J'*J))*p = -J'*r = -g
     *
     * @return predicted reduction
     */
    @Override
    protected double predictedReduction( DenseMatrix64F param, DenseMatrix64F gradientNegative, double mu ) {
        double p_dot_g = VectorVectorMult.innerProd(param,gradientNegative);
        double p_JJ_p = 0;
        for( int i = 0; i < N; i++ )
            p_JJ_p += param.data[i]*Bdiag.data[i]*param.data[i];

        // gradientNegative holds -g, so p_dot_g is p'*(-g)
        return 0.5*(p_dot_g + mu*p_JJ_p);
    }
}
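A quick check on predictedReduction above, since the sign conventions are easy to trip over: with B = J'J, D = diag(B), and the step p solving the damped normal equations, the value the method returns follows directly. A worked derivation (added here for clarity; not part of the original source), in LaTeX:

\begin{aligned}
m_k(p) &= f_k + g^T p + \tfrac{1}{2}\, p^T B p, \qquad B = J^T J,\quad D = \mathrm{diag}(B) \\
(B + \mu D)\, p &= -g \quad\Rightarrow\quad B p = -g - \mu D p \\
m_k(0) - m_k(p) &= -g^T p - \tfrac{1}{2}\, p^T B p
  = -g^T p + \tfrac{1}{2}\, g^T p + \tfrac{1}{2}\,\mu\, p^T D p \\
 &= \tfrac{1}{2}\Big( p^T(-g) + \mu \sum_i B_{ii}\, p_i^2 \Big)
\end{aligned}

This is exactly 0.5*(p_dot_g + mu*p_JJ_p): p_dot_g is the inner product of the step with the negated gradient, and p_JJ_p accumulates B_ii*p_i^2 from the stored diagonal Bdiag.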
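Since this impl class is normally reached through DDogleg's factory rather than instantiated directly, a usage sketch may help. The sketch below follows the public API (FactoryOptimization.leastSquaresLM, UnconstrainedLeastSquares, UtilOptimize) as it appears in DDogleg's documented least-squares examples; the ExpFit residual function and its sample data are hypothetical, and interface method names may differ slightly between DDogleg versions:

import org.ddogleg.optimization.FactoryOptimization;
import org.ddogleg.optimization.UnconstrainedLeastSquares;
import org.ddogleg.optimization.UtilOptimize;
import org.ddogleg.optimization.functions.FunctionNtoM;

public class LevenbergMarquardtExample {

    // hypothetical residuals for fitting y = a*exp(b*t) to three sample points
    public static class ExpFit implements FunctionNtoM {
        double[] t = { 0.0, 1.0, 2.0 };
        double[] y = { 2.0, 5.4, 14.8 };

        @Override public int getNumOfInputsN() { return 2; }   // parameters: a, b
        @Override public int getNumOfOutputsM() { return 3; }  // one residual per sample

        @Override public void process( double[] param, double[] residual ) {
            double a = param[0], b = param[1];
            for (int i = 0; i < t.length; i++)
                residual[i] = a*Math.exp(b*t[i]) - y[i];
        }
    }

    public static void main( String[] args ) {
        // second argument selects robustness: false => faster Cholesky-based solver,
        // true => slower but more robust pseudo-inverse style solver
        UnconstrainedLeastSquares optimizer = FactoryOptimization.leastSquaresLM(1e-3, false);

        optimizer.setFunction(new ExpFit(), null);              // null => numerical Jacobian
        optimizer.initialize(new double[]{ 1, 1 }, 1e-12, 1e-12);
        UtilOptimize.process(optimizer, 500);                   // iterate at most 500 times

        double[] found = optimizer.getParameters();
        System.out.printf("a = %.4f  b = %.4f%n", found[0], found[1]);
    }
}

Passing true as the second argument to leastSquaresLM swaps in the slower but more robust solver, the same Cholesky versus pseudo-inverse trade-off described in the class Javadoc above.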



