boofcv.alg.tracker.meanshift.TrackerMeanShiftLikelihood Maven / Gradle / Ivy
Show all versions of boofcv-recognition Show documentation
/*
* Copyright (c) 2021, Peter Abeles. All Rights Reserved.
*
* This file is part of BoofCV (http://boofcv.org).
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package boofcv.alg.tracker.meanshift;
import boofcv.alg.misc.ImageMiscOps;
import boofcv.struct.image.GrayF32;
import boofcv.struct.image.ImageBase;
import boofcv.struct.sparse.SparseImageSample_F32;
import georegression.struct.shapes.Rectangle2D_I32;
import georegression.struct.shapes.RectangleLength2D_I32;
/**
*
* Mean-shift [1] based tracker which tracks the target inside a likelihood image using a flat rectangular kernel
* of fixed size. The likelihood for each pixel is computed using {@link SparseImageSample_F32}. How that
* model is computed is not specified by this class, but is often based on color. For sake of efficiency, the
* likelihood for a pixel is only computed as needed.
*
*
*
* This algorithm can run very fast and works well when the target being tracked is visually distinctive from
* the background and largely composed of one color. It can't handle changes in scale or shape of the target,
* which does limit its applications.
*
*
*
* [1] Yizong Chen, "Mean Shift, Mode Seeking, and Clustering" IEEE Trans. Pattern Analysis and Machine Intelligence,
* VOL. 17, NO. 8, August 1995
*
*
* @author Peter Abeles
*/
public class TrackerMeanShiftLikelihood> {
// likelihood model for the target being tracked
private SparseImageSample_F32 targetModel;
// image used to store the likelihood
private GrayF32 pdf = new GrayF32(1, 1);
// current location of the target
private RectangleLength2D_I32 location = new RectangleLength2D_I32();
// rectangle inside of PDF which has been modified. Used to minimize writing to the image. probably
// premature optimization
private Rectangle2D_I32 dirty = new Rectangle2D_I32();
// maximum number of iterations
private int maxIterations;
// if the total sum of the likelihood drops below this value it is assumed that the target has been lost
private float minimumSum;
// fraction of initial likelihood sum which minimumSum is set to
private float minFractionDrop;
// if true the tracker has failed
private boolean failed;
/**
* Configures tracker
*
* @param targetModel Target used to model the target's likelihood
* @param maxIterations Maximum number of iterations. try 20
* @param minFractionDrop If the likelihood drops below its initial value by this fraction the track is
* assumed to be lost
*/
public TrackerMeanShiftLikelihood( PixelLikelihood targetModel, int maxIterations, float minFractionDrop ) {
this.targetModel = targetModel;
this.maxIterations = maxIterations;
this.minFractionDrop = minFractionDrop;
}
/**
* Specifies the initial target location so that it can learn its description
*
* @param image Image
* @param initial Initial target location and the mean-shift bandwidth
*/
public void initialize( T image, RectangleLength2D_I32 initial ) {
if (!image.isInBounds(initial.x0, initial.y0))
throw new IllegalArgumentException("Initial rectangle is out of bounds!");
if (!image.isInBounds(initial.x0 + initial.width, initial.y0 + initial.height))
throw new IllegalArgumentException("Initial rectangle is out of bounds!");
pdf.reshape(image.width, image.height);
ImageMiscOps.fill(pdf, -1);
setTrackLocation(initial);
failed = false;
// compute the initial sum of the likelihood so that it can detect when the target is no longer visible
minimumSum = 0;
targetModel.setImage(image);
for (int y = 0; y < initial.height; y++) {
for (int x = 0; x < initial.width; x++) {
minimumSum += targetModel.compute(x + initial.x0, y + initial.y0);
}
}
minimumSum *= minFractionDrop;
}
/**
* Used to set the location of the track without changing any appearance history.
*
* @param location new location
*/
public void setTrackLocation( RectangleLength2D_I32 location ) {
this.location.setTo(location);
// massage the rectangle so that it has an odd width and height
// otherwise it could experience a bias when localizing
this.location.width += 1 - this.location.width%2;
this.location.height += 1 - this.location.height%2;
failed = false;
}
/**
* Updates the target's location in the image by performing a mean-shift search. Returns if it was
* successful at finding the target or not. If it fails once it will need to be re-initialized
*
* @param image Most recent image in the sequence
* @return true for success or false if it failed
*/
public boolean process( T image ) {
if (failed)
return false;
targetModel.setImage(image);
// mark the region where the pdf has been modified as dirty
dirty.setTo(location.x0, location.y0, location.x0 + location.width, location.y0 + location.height);
// compute the pdf inside the initial rectangle
updatePdfImage(location.x0, location.y0, location.x0 + location.width, location.y0 + location.height);
// current location of the target
int x0 = location.x0;
int y0 = location.y0;
// previous location of the target in the most recent iteration
int prevX = x0;
int prevY = y0;
// iterate until it converges or reaches the maximum number of iterations
for (int i = 0; i < maxIterations; i++) {
// compute the weighted centroid using the likelihood function
float totalPdf = 0;
float sumX = 0;
float sumY = 0;
for (int y = 0; y < location.height; y++) {
int indexPdf = pdf.startIndex + pdf.stride*(y + y0) + x0;
for (int x = 0; x < location.width; x++) {
float p = pdf.data[indexPdf++];
totalPdf += p;
sumX += (x0 + x)*p;
sumY += (y0 + y)*p;
}
}
// if the target isn't likely to be in view, give up
if (totalPdf <= minimumSum) {
failed = true;
return false;
}
// Use the new center to find the new top left corner, while rounding to the nearest integer
x0 = (int)(sumX/totalPdf - location.width/2 + 0.5f);
y0 = (int)(sumY/totalPdf - location.height/2 + 0.5f);
// make sure it doesn't go outside the image
if (x0 < 0)
x0 = 0;
else if (x0 >= image.width - location.width)
x0 = image.width - location.width;
if (y0 < 0)
y0 = 0;
else if (y0 >= image.height - location.height)
y0 = image.height - location.height;
// see if it has converged
if (x0 == prevX && y0 == prevY)
break;
// save the previous location
prevX = x0;
prevY = y0;
// update the pdf
updatePdfImage(x0, y0, x0 + location.width, y0 + location.height);
}
// update the output
location.x0 = x0;
location.y0 = y0;
// clean up the image for the next iteration
ImageMiscOps.fillRectangle(pdf, -1, dirty.x0, dirty.y0, dirty.x1 - dirty.x0, dirty.y1 - dirty.y0);
return true;
}
/**
* Computes the PDF only inside the image as needed amd update the dirty rectangle
*/
protected void updatePdfImage( int x0, int y0, int x1, int y1 ) {
for (int y = y0; y < y1; y++) {
int indexOut = pdf.startIndex + pdf.stride*y + x0;
for (int x = x0; x < x1; x++, indexOut++) {
if (pdf.data[indexOut] < 0)
pdf.data[indexOut] = targetModel.compute(x, y);
}
}
// update the dirty region
if (dirty.x0 > x0)
dirty.x0 = x0;
if (dirty.y0 > y0)
dirty.y0 = y0;
if (dirty.x1 < x1)
dirty.x1 = x1;
if (dirty.y1 < y1)
dirty.y1 = y1;
}
/**
* Current location of target in the image
*
* @return rectangle containing the target
*/
public RectangleLength2D_I32 getLocation() {
return location;
}
/**
* If true the tracker has filed
*/
public boolean isFailed() {
return failed;
}
}