All Downloads are FREE. Search and download functionalities are using the official Maven repository.

smile.clustering.linkage.UPGMALinkage Maven / Gradle / Ivy

The newest version!
/*******************************************************************************
 * Copyright (c) 2010 Haifeng Li
 *   
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *  
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *******************************************************************************/

package smile.clustering.linkage;

/**
 * Unweighted Pair Group Method with Arithmetic mean (also known as average linkage).
 * The distance between two clusters is the mean distance between all possible
 * pairs of nodes in the two clusters. 
 * 

* In bioinformatics, UPGMA is used for the creation of phenetic trees * (phenograms). UPGMA assumes a constant rate of evolution (molecular * clock hypothesis), and is not a well-regarded method for inferring * relationships unless this assumption has been tested and justified * for the data set being used. * * @author Haifeng Li */ public class UPGMALinkage extends Linkage { /** * The number of samples in each cluster. */ private int[] n; /** * Constructor. * @param proximity the proximity matrix to store the distance measure of * dissimilarity. To save space, we only need the lower half of matrix. */ public UPGMALinkage(double[][] proximity) { this.proximity = proximity; n = new int[proximity.length]; for (int i = 0; i < n.length; i++) n[i] = 1; } @Override public String toString() { return "UPGMA linkage"; } @Override public void merge(int i, int j) { double sum = n[i] + n[j]; for (int k = 0; k < i; k++) { proximity[i][k] = proximity[i][k] * n[i] / sum + d(j, k) * n[j] / sum; } for (int k = i+1; k < proximity.length; k++) { proximity[k][i] = proximity[k][i] * n[i] / sum + d(j, k) * n[j] / sum; } n[i] += n[j]; } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy