org.gephi.statistics.plugin.Modularity Maven / Gradle / Ivy
The newest version!
/*
Copyright 2008-2011 Gephi
Authors : Patick J. McSweeney , Sebastien Heymann
Website : http://www.gephi.org
This file is part of Gephi.
DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
Copyright 2011 Gephi Consortium. All rights reserved.
The contents of this file are subject to the terms of either the GNU
General Public License Version 3 only ("GPL") or the Common
Development and Distribution License("CDDL") (collectively, the
"License"). You may not use this file except in compliance with the
License. You can obtain a copy of the License at
http://gephi.org/about/legal/license-notice/
or /cddl-1.0.txt and /gpl-3.0.txt. See the License for the
specific language governing permissions and limitations under the
License. When distributing the software, include this License Header
Notice in each file and include the License files at
/cddl-1.0.txt and /gpl-3.0.txt. If applicable, add the following below the
License Header, with the fields enclosed by brackets [] replaced by
your own identifying information:
"Portions Copyrighted [year] [name of copyright owner]"
If you wish your version of this file to be governed by only the CDDL
or only the GPL Version 3, indicate your decision by adding
"[Contributor] elects to include this software in this distribution
under the [CDDL or GPL Version 3] license." If you do not indicate a
single choice of license, a recipient has the option to distribute
your version of this file under either the CDDL, the GPL Version 3 or
to extend the choice of license to its licensees as provided above.
However, if you add GPL Version 3 code and therefore, elected the GPL
Version 3 license, then the option applies only if the new code is
made subject to such option by the copyright holder.
Contributor(s): Thomas Aynaud
Portions Copyrighted 2011 Gephi Consortium.
*/
package org.gephi.statistics.plugin;
import java.text.DecimalFormat;
import java.text.NumberFormat;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Random;
import java.util.Set;
import org.gephi.graph.api.Column;
import org.gephi.graph.api.Edge;
import org.gephi.graph.api.Graph;
import org.gephi.graph.api.GraphModel;
import org.gephi.graph.api.Node;
import org.gephi.graph.api.NodeIterable;
import org.gephi.graph.api.Table;
import org.gephi.statistics.spi.Statistics;
import org.gephi.utils.longtask.spi.LongTask;
import org.gephi.utils.progress.Progress;
import org.gephi.utils.progress.ProgressTicket;
import org.jfree.chart.ChartFactory;
import org.jfree.chart.JFreeChart;
import org.jfree.chart.plot.PlotOrientation;
import org.jfree.data.xy.XYSeries;
import org.jfree.data.xy.XYSeriesCollection;
/**
* @author pjmcswee
*/
public class Modularity implements Statistics, LongTask {
public static final String MODULARITY_CLASS = "modularity_class";
private ProgressTicket progress;
private boolean isCanceled;
private CommunityStructure structure;
private double modularity;
private double modularityResolution;
private boolean isRandomized = false;
private boolean useWeight = true;
private double resolution = 1.;
private int initialModularityClassIndex = 0;
public boolean getRandom() {
return isRandomized;
}
public void setRandom(boolean isRandomized) {
this.isRandomized = isRandomized;
}
public boolean getUseWeight() {
return useWeight;
}
public void setUseWeight(boolean useWeight) {
this.useWeight = useWeight;
}
public double getResolution() {
return resolution;
}
public void setResolution(double resolution) {
this.resolution = resolution;
}
public int getInitialModularityClassIndex(){
return initialModularityClassIndex;
}
public void setInitialModularityClassIndex(int initialModularityClassIndex){
this.initialModularityClassIndex = initialModularityClassIndex;
}
@Override
public boolean cancel() {
this.isCanceled = true;
return true;
}
@Override
public void setProgressTicket(ProgressTicket progressTicket) {
this.progress = progressTicket;
}
@Override
public void execute(GraphModel graphModel) {
Graph graph = graphModel.getUndirectedGraphVisible();
execute(graph);
}
public void execute(Graph graph) {
isCanceled = false;
Table nodeTable = graph.getModel().getNodeTable();
ColumnUtils.cleanUpColumns(nodeTable, new String[] {MODULARITY_CLASS}, Integer.class);
Column modCol = nodeTable.getColumn(MODULARITY_CLASS);
if (modCol == null) {
nodeTable.addColumn(MODULARITY_CLASS, "Modularity Class", Integer.class, 0);
}
graph.readLock();
try {
structure = new Modularity.CommunityStructure(graph);
int[] comStructure = new int[graph.getNodeCount()];
if (graph.getNodeCount() > 0) {//Fixes issue #713 Modularity Calculation Throws Exception On Empty Graph
HashMap computedModularityMetrics =
computeModularity(graph, structure, comStructure, resolution, isRandomized, useWeight);
modularity = computedModularityMetrics.get("modularity");
modularityResolution = computedModularityMetrics.get("modularityResolution");
} else {
modularity = 0;
modularityResolution = 0;
}
for(int i = 0; i < comStructure.length; i++){
comStructure[i] = comStructure[i] + initialModularityClassIndex;
}
saveValues(comStructure, graph, structure);
} finally {
graph.readUnlock();
}
}
protected HashMap computeModularity(Graph graph, CommunityStructure theStructure,
int[] comStructure,
double currentResolution, boolean randomized,
boolean weighted) {
isCanceled = false;
Progress.start(progress);
Random rand = new Random();
double totalWeight = theStructure.graphWeightSum;
double[] nodeDegrees = theStructure.weights.clone();
HashMap results = new HashMap<>();
if (isCanceled) {
return results;
}
boolean someChange = true;
while (someChange) {
someChange = false;
boolean localChange = true;
while (localChange) {
localChange = false;
int start = 0;
if (randomized) {
start = Math.abs(rand.nextInt()) % theStructure.N;
}
int step = 0;
for (int i = start; step < theStructure.N; i = (i + 1) % theStructure.N) {
step++;
Community bestCommunity = updateBestCommunity(theStructure, i, currentResolution);
if ((theStructure.nodeCommunities[i] != bestCommunity) && (bestCommunity != null)) {
theStructure.moveNodeTo(i, bestCommunity);
localChange = true;
}
if (isCanceled) {
return results;
}
}
someChange = localChange || someChange;
if (isCanceled) {
return results;
}
}
if (someChange) {
theStructure.zoomOut();
}
}
fillComStructure(graph, theStructure, comStructure);
double[] degreeCount = fillDegreeCount(graph, theStructure, comStructure, nodeDegrees, weighted);
double computedModularity = finalQ(comStructure, degreeCount, graph, theStructure, totalWeight, 1., weighted);
double computedModularityResolution =
finalQ(comStructure, degreeCount, graph, theStructure, totalWeight, currentResolution, weighted);
results.put("modularity", computedModularity);
results.put("modularityResolution", computedModularityResolution);
return results;
}
private Community updateBestCommunity(CommunityStructure theStructure, int node_id, double currentResolution) {
double best = 0.;
Community bestCommunity = null;
Set iter = theStructure.nodeConnectionsWeight[node_id].keySet();
for (Community com : iter) {
double qValue = q(node_id, com, theStructure, currentResolution);
if (qValue > best) {
best = qValue;
bestCommunity = com;
}
}
return bestCommunity;
}
private int[] fillComStructure(Graph graph, CommunityStructure theStructure, int[] comStructure) {
int count = 0;
for (Community com : theStructure.communities) {
for (Integer node : com.nodes) {
Community hidden = theStructure.invMap.get(node);
for (Integer nodeInt : hidden.nodes) {
comStructure[nodeInt] = count;
}
}
count++;
}
return comStructure;
}
private double[] fillDegreeCount(Graph graph, CommunityStructure theStructure, int[] comStructure,
double[] nodeDegrees, boolean weighted) {
double[] degreeCount = new double[theStructure.communities.size()];
for (Node node : graph.getNodes()) {
int index = theStructure.map.get(node);
if (weighted) {
degreeCount[comStructure[index]] += nodeDegrees[index];
} else {
degreeCount[comStructure[index]] += graph.getDegree(node);
}
}
return degreeCount;
}
private double finalQ(int[] struct, double[] degrees, Graph graph,
CommunityStructure theStructure, double totalWeight, double usedResolution,
boolean weighted) {
double res = 0;
double[] internal = new double[degrees.length];
for (Node n : graph.getNodes()) {
int n_index = theStructure.map.get(n);
for (Edge edge : graph.getEdges(n)) {
Node neighbor = graph.getOpposite(n, edge);
if (n == neighbor) {
continue;
}
int neigh_index = theStructure.map.get(neighbor);
if (struct[neigh_index] == struct[n_index]) {
if (weighted) {
internal[struct[neigh_index]] += edge.getWeight(graph.getView());
} else {
internal[struct[neigh_index]]++;
}
}
}
}
for (int i = 0; i < degrees.length; i++) {
internal[i] /= 2.0;
res += usedResolution * (internal[i] / totalWeight) - Math.pow(degrees[i] / (2 * totalWeight), 2);//HERE
}
return res;
}
private void saveValues(int[] struct, Graph graph, CommunityStructure theStructure) {
Table nodeTable = graph.getModel().getNodeTable();
Column modCol = nodeTable.getColumn(MODULARITY_CLASS);
for (Node n : graph.getNodes()) {
int n_index = theStructure.map.get(n);
n.setAttribute(modCol, struct[n_index]);
}
}
public double getModularity() {
return modularity;
}
@Override
public String getReport() {
//Distribution series
Map sizeDist = new HashMap<>();
for (Node n : structure.graph.getNodes()) {
Integer v = (Integer) n.getAttribute(MODULARITY_CLASS);
if (!sizeDist.containsKey(v)) {
sizeDist.put(v, 0);
}
sizeDist.put(v, sizeDist.get(v) + 1);
}
XYSeries dSeries = ChartUtils.createXYSeries(sizeDist, "Size Distribution");
XYSeriesCollection dataset1 = new XYSeriesCollection();
dataset1.addSeries(dSeries);
JFreeChart chart = ChartFactory.createXYLineChart(
"Size Distribution",
"Modularity Class",
"Size (number of nodes)",
dataset1,
PlotOrientation.VERTICAL,
true,
false,
false);
chart.removeLegend();
ChartUtils.decorateChart(chart);
ChartUtils.scaleChart(chart, dSeries, false);
String imageFile = ChartUtils.renderChart(chart, "communities-size-distribution.png");
NumberFormat f = new DecimalFormat("#0.000");
String report = " Modularity Report
"
+ "
"
+ " Parameters:
"
+ "Randomize: " + (isRandomized ? "On" : "Off") + "
"
+ "Use edge weights: " + (useWeight ? "On" : "Off") + "
"
+ "Resolution: " + (resolution) + "
"
+ "
Results:
"
+ "Modularity: " + f.format(modularity) + "
"
+ "Modularity with resolution: " + f.format(modularityResolution) + "
"
+ "Number of Communities: " + structure.communities.size()
+ "
" + imageFile
+ "
" + " Algorithm:
"
+
"Vincent D Blondel, Jean-Loup Guillaume, Renaud Lambiotte, Etienne Lefebvre, Fast unfolding of communities in large networks, in Journal of Statistical Mechanics: Theory and Experiment 2008 (10), P1000
"
+ "
" + " Resolution:
"
+
"R. Lambiotte, J.-C. Delvenne, M. Barahona Laplacian Dynamics and Multiscale Modular Structure in Networks 2009
"
+ " ";
return report;
}
private double q(int node, Community community, CommunityStructure theStructure, double currentResolution) {
Float edgesToFloat = theStructure.nodeConnectionsWeight[node].get(community);
double edgesTo = 0;
if (edgesToFloat != null) {
edgesTo = edgesToFloat.doubleValue();
}
double weightSum = community.weightSum;
double nodeWeight = theStructure.weights[node];
double qValue = currentResolution * edgesTo - (nodeWeight * weightSum) / (2.0 * theStructure.graphWeightSum);
if ((theStructure.nodeCommunities[node] == community) && (theStructure.nodeCommunities[node].size() > 1)) {
qValue = currentResolution * edgesTo -
(nodeWeight * (weightSum - nodeWeight)) / (2.0 * theStructure.graphWeightSum);
}
if ((theStructure.nodeCommunities[node] == community) && (theStructure.nodeCommunities[node].size() == 1)) {
qValue = 0.;
}
return qValue;
}
class ModEdge {
int source;
int target;
float weight;
public ModEdge(int s, int t, float w) {
source = s;
target = t;
weight = w;
}
}
class CommunityStructure {
HashMap[] nodeConnectionsWeight;
HashMap[] nodeConnectionsCount;
HashMap map;
Community[] nodeCommunities;
Graph graph;
double[] weights;
double graphWeightSum;
List[] topology;
List communities;
int N;
HashMap invMap;
CommunityStructure(Graph graph) {
this.graph = graph;
N = graph.getNodeCount();
invMap = new HashMap<>();
nodeConnectionsWeight = new HashMap[N];
nodeConnectionsCount = new HashMap[N];
nodeCommunities = new Community[N];
map = new HashMap<>();
topology = new ArrayList[N];
communities = new ArrayList<>();
int index = 0;
weights = new double[N];
NodeIterable nodesIterable = graph.getNodes();
for (Node node : nodesIterable) {
map.put(node, index);
nodeCommunities[index] = new Community(this);
nodeConnectionsWeight[index] = new HashMap<>();
nodeConnectionsCount[index] = new HashMap<>();
weights[index] = 0;
nodeCommunities[index].seed(index);
Community hidden = new Community(structure);
hidden.nodes.add(index);
invMap.put(index, hidden);
communities.add(nodeCommunities[index]);
index++;
if (isCanceled) {
nodesIterable.doBreak();
return;
}
}
int[] edgeTypes = graph.getModel().getEdgeTypes();
nodesIterable = graph.getNodes();
for (Node node : nodesIterable) {
int node_index = map.get(node);
topology[node_index] = new ArrayList<>();
Set uniqueNeighbors = new HashSet<>(graph.getNeighbors(node).toCollection());
for (Node neighbor : uniqueNeighbors) {
if (node == neighbor) {
continue;
}
int neighbor_index = map.get(neighbor);
float weight = 0;
//Sum all parallel edges weight:
for (int edgeType : edgeTypes) {
for (Edge edge : graph.getEdges(node, neighbor, edgeType)) {
if (useWeight) {
weight += edge.getWeight(graph.getView());
} else {
weight += 1;
}
}
}
//Finally add a single edge with the summed weight of all parallel edges:
//Fixes issue #1419 Getting null pointer error when trying to calculate modularity
weights[node_index] += weight;
Modularity.ModEdge me = new ModEdge(node_index, neighbor_index, weight);
topology[node_index].add(me);
Community adjCom = nodeCommunities[neighbor_index];
nodeConnectionsWeight[node_index].put(adjCom, weight);
nodeConnectionsCount[node_index].put(adjCom, 1);
Community nodeCom = nodeCommunities[node_index];
nodeCom.connectionsWeight.put(adjCom, weight);
nodeCom.connectionsCount.put(adjCom, 1);
nodeConnectionsWeight[neighbor_index].put(nodeCom, weight);
nodeConnectionsCount[neighbor_index].put(nodeCom, 1);
adjCom.connectionsWeight.put(nodeCom, weight);
adjCom.connectionsCount.put(nodeCom, 1);
graphWeightSum += weight;
}
if (isCanceled) {
nodesIterable.doBreak();
return;
}
}
graphWeightSum /= 2.0;
}
private void addNodeTo(int node, Community to) {
to.add(node);
nodeCommunities[node] = to;
for (ModEdge e : topology[node]) {
int neighbor = e.target;
////////
//Remove Node Connection to this community
Float neighEdgesTo = nodeConnectionsWeight[neighbor].get(to);
if (neighEdgesTo == null) {
nodeConnectionsWeight[neighbor].put(to, e.weight);
} else {
nodeConnectionsWeight[neighbor].put(to, neighEdgesTo + e.weight);
}
Integer neighCountEdgesTo = nodeConnectionsCount[neighbor].get(to);
if (neighCountEdgesTo == null) {
nodeConnectionsCount[neighbor].put(to, 1);
} else {
nodeConnectionsCount[neighbor].put(to, neighCountEdgesTo + 1);
}
///////////////////
Modularity.Community adjCom = nodeCommunities[neighbor];
Float wEdgesto = adjCom.connectionsWeight.get(to);
if (wEdgesto == null) {
adjCom.connectionsWeight.put(to, e.weight);
} else {
adjCom.connectionsWeight.put(to, wEdgesto + e.weight);
}
Integer cEdgesto = adjCom.connectionsCount.get(to);
if (cEdgesto == null) {
adjCom.connectionsCount.put(to, 1);
} else {
adjCom.connectionsCount.put(to, cEdgesto + 1);
}
Float nodeEdgesTo = nodeConnectionsWeight[node].get(adjCom);
if (nodeEdgesTo == null) {
nodeConnectionsWeight[node].put(adjCom, e.weight);
} else {
nodeConnectionsWeight[node].put(adjCom, nodeEdgesTo + e.weight);
}
Integer nodeCountEdgesTo = nodeConnectionsCount[node].get(adjCom);
if (nodeCountEdgesTo == null) {
nodeConnectionsCount[node].put(adjCom, 1);
} else {
nodeConnectionsCount[node].put(adjCom, nodeCountEdgesTo + 1);
}
if (to != adjCom) {
Float comEdgesto = to.connectionsWeight.get(adjCom);
if (comEdgesto == null) {
to.connectionsWeight.put(adjCom, e.weight);
} else {
to.connectionsWeight.put(adjCom, comEdgesto + e.weight);
}
Integer comCountEdgesto = to.connectionsCount.get(adjCom);
if (comCountEdgesto == null) {
to.connectionsCount.put(adjCom, 1);
} else {
to.connectionsCount.put(adjCom, comCountEdgesto + 1);
}
}
}
}
private void removeNodeFromItsCommunity(int node) {
Community community = nodeCommunities[node];
for (ModEdge e : topology[node]) {
int neighbor = e.target;
////////
//Remove Node Connection to this community
Float edgesTo = nodeConnectionsWeight[neighbor].get(community);
Integer countEdgesTo = nodeConnectionsCount[neighbor].get(community);
if (countEdgesTo - 1 == 0) {
nodeConnectionsWeight[neighbor].remove(community);
nodeConnectionsCount[neighbor].remove(community);
} else {
nodeConnectionsWeight[neighbor].put(community, edgesTo - e.weight);
nodeConnectionsCount[neighbor].put(community, countEdgesTo - 1);
}
///////////////////
//Remove Adjacency Community's connection to this community
Modularity.Community adjCom = nodeCommunities[neighbor];
Float oEdgesto = adjCom.connectionsWeight.get(community);
Integer oCountEdgesto = adjCom.connectionsCount.get(community);
if (oCountEdgesto - 1 == 0) {
adjCom.connectionsWeight.remove(community);
adjCom.connectionsCount.remove(community);
} else {
adjCom.connectionsWeight.put(community, oEdgesto - e.weight);
adjCom.connectionsCount.put(community, oCountEdgesto - 1);
}
if (node == neighbor) {
continue;
}
if (adjCom != community) {
Float comEdgesto = community.connectionsWeight.get(adjCom);
Integer comCountEdgesto = community.connectionsCount.get(adjCom);
if (comCountEdgesto - 1 == 0) {
community.connectionsWeight.remove(adjCom);
community.connectionsCount.remove(adjCom);
} else {
community.connectionsWeight.put(adjCom, comEdgesto - e.weight);
community.connectionsCount.put(adjCom, comCountEdgesto - 1);
}
}
Float nodeEgesTo = nodeConnectionsWeight[node].get(adjCom);
Integer nodeCountEgesTo = nodeConnectionsCount[node].get(adjCom);
if (nodeCountEgesTo - 1 == 0) {
nodeConnectionsWeight[node].remove(adjCom);
nodeConnectionsCount[node].remove(adjCom);
} else {
nodeConnectionsWeight[node].put(adjCom, nodeEgesTo - e.weight);
nodeConnectionsCount[node].put(adjCom, nodeCountEgesTo - 1);
}
}
community.remove(node);
}
private void moveNodeTo(int node, Community to) {
removeNodeFromItsCommunity(node);
addNodeTo(node, to);
}
private void zoomOut() {
int M = communities.size();
ArrayList[] newTopology = new ArrayList[M];
int index = 0;
nodeCommunities = new Community[M];
nodeConnectionsWeight = new HashMap[M];
nodeConnectionsCount = new HashMap[M];
HashMap newInvMap = new HashMap<>();
for (int i = 0; i < communities.size(); i++) {//Community com : mCommunities) {
Community com = communities.get(i);
nodeConnectionsWeight[index] = new HashMap<>();
nodeConnectionsCount[index] = new HashMap<>();
newTopology[index] = new ArrayList<>();
nodeCommunities[index] = new Community(com);
Set iter = com.connectionsWeight.keySet();
double weightSum = 0;
Community hidden = new Community(structure);
for (Integer nodeInt : com.nodes) {
Community oldHidden = invMap.get(nodeInt);
hidden.nodes.addAll(oldHidden.nodes);
}
newInvMap.put(index, hidden);
for (Modularity.Community adjCom : iter) {
int target = communities.indexOf(adjCom);
float weight = com.connectionsWeight.get(adjCom);
if (target == index) {
weightSum += 2. * weight;
} else {
weightSum += weight;
}
ModEdge e = new ModEdge(index, target, weight);
newTopology[index].add(e);
}
weights[index] = weightSum;
nodeCommunities[index].seed(index);
index++;
}
communities.clear();
for (int i = 0; i < M; i++) {
Community com = nodeCommunities[i];
communities.add(com);
for (ModEdge e : newTopology[i]) {
nodeConnectionsWeight[i].put(nodeCommunities[e.target], e.weight);
nodeConnectionsCount[i].put(nodeCommunities[e.target], 1);
com.connectionsWeight.put(nodeCommunities[e.target], e.weight);
com.connectionsCount.put(nodeCommunities[e.target], 1);
}
}
N = M;
topology = newTopology;
invMap = newInvMap;
}
}
class Community {
double weightSum;
CommunityStructure structure;
List nodes;
HashMap connectionsWeight;
HashMap connectionsCount;
public Community(Modularity.Community com) {
structure = com.structure;
connectionsWeight = new HashMap<>();
connectionsCount = new HashMap<>();
nodes = new ArrayList<>();
//mHidden = pCom.mHidden;
}
public Community(CommunityStructure structure) {
this.structure = structure;
connectionsWeight = new HashMap<>();
connectionsCount = new HashMap<>();
nodes = new ArrayList<>();
}
public int size() {
return nodes.size();
}
public void seed(int node) {
nodes.add(node);
weightSum += structure.weights[node];
}
public boolean add(int node) {
nodes.add(node);
weightSum += structure.weights[node];
return true;
}
public boolean remove(int node) {
boolean result = nodes.remove((Integer) node);
weightSum -= structure.weights[node];
if (nodes.isEmpty()) {
structure.communities.remove(this);
}
return result;
}
}
}