gov.sandia.cognition.learning.algorithm.clustering.divergence.ClusterMeanLinkDivergenceFunction Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of cognitive-foundry Show documentation
Show all versions of cognitive-foundry Show documentation
A single jar with all the Cognitive Foundry components.
/*
* File: ClusterMeanLinkDivergenceFunction.java
* Authors: Justin Basilico
* Company: Sandia National Laboratories
* Project: Cognitive Foundry
*
* Copyright June 28, 2006, Sandia Corporation. Under the terms of Contract
* DE-AC04-94AL85000, there is a non-exclusive license for use of this work by
* or on behalf of the U.S. Government. Export of this program may require a
* license from the United States Government. See CopyrightHistory.txt for
* complete details.
*
*/
package gov.sandia.cognition.learning.algorithm.clustering.divergence;
import gov.sandia.cognition.annotation.CodeReview;
import gov.sandia.cognition.learning.algorithm.clustering.cluster.Cluster;
import gov.sandia.cognition.math.DivergenceFunction;
import java.util.Collection;
/**
* The ClusterMeanLinkDivergenceFunction class implements the mean linkage
* distance metric between two clusters. That is, the value returned by the
* metric is the mean distance between any point in the first cluster and any
* point in the second cluster.
*
* @param type of {@code Cluster} used in the
* {@code learn()} method
* @param The algorithm operates on a {@code Collection},
* so {@code DataType} will be something like Vector or String
* @author Justin Basilico
* @since 1.0
*/
@CodeReview(
reviewer="Kevin R. Dixon",
date="2008-07-23",
changesNeeded=false,
comments={
"Cleaned up javadoc a little bit with code annotations.",
"Otherwise, looks fine."
}
)
public class ClusterMeanLinkDivergenceFunction, DataType>
extends AbstractClusterToClusterDivergenceFunction
{
/**
* Creates a new instance of ClusterMeanLinkDivergenceFunction.
*/
public ClusterMeanLinkDivergenceFunction()
{
this(null);
}
/**
* Creates a new instance of ClusterMeanLinkDivergenceFunction using
* the given divergence function for elements.
*
* @param divergenceFunction The divergence function for elements.
*/
public ClusterMeanLinkDivergenceFunction(
DivergenceFunction super DataType, ? super DataType> divergenceFunction)
{
super(divergenceFunction);
}
/**
* The method computes the complete link distance between the two given
* Clusters. The distance returned is the mean distance between a member
* of the first cluster and a member of the second cluster.
*
* @param from The first Cluster.
* @param to The second Cluster.
* @return The mean link distance between the two given Clusters.
*/
public double evaluate(
ClusterType from,
ClusterType to)
{
// Get the members of each cluster.
Collection fromMembers = from.getMembers();
Collection toMembers = to.getMembers();
// Since we are going to compute the mean we need to know the
// sum of all the distances along with the total number of pairs.
double sum = 0.0;
int numPairs = fromMembers.size() * toMembers.size();
// Double-loop over the members of each cluster.
for ( DataType first : fromMembers )
{
for ( DataType second : toMembers )
{
// Compute the distance between the two memebers.
double distance =
this.divergenceFunction.evaluate(first, second);
// Add the distance to the sum.
sum += distance;
}
}
// Return the mean of the distance.
return sum / (double) numPairs;
}
}