org.neo4j.gds.similarity.nodesim.JaccardSimilarityComputer Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of similarity-params Show documentation
Show all versions of similarity-params Show documentation
Neo4j Graph Data Science :: Similarity Algorithms Parameters
The newest version!
/*
* Copyright (c) "Neo4j"
* Neo4j Sweden AB [http://neo4j.com]
*
* This file is part of Neo4j.
*
* Neo4j is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see .
*/
package org.neo4j.gds.similarity.nodesim;
import org.neo4j.gds.core.utils.Intersections;
public class JaccardSimilarityComputer implements MetricSimilarityComputer {
private final double similarityCutoff;
public JaccardSimilarityComputer(double similarityCutoff) {
this.similarityCutoff = similarityCutoff;
}
@Override
public double computeSimilarity(long[] vector1, long[] vector2) {
long intersection = Intersections.intersection3(vector1, vector2);
long union = vector1.length + vector2.length - intersection;
double similarity = union == 0 ? 0 : intersection / (double) union;
return similarity >= similarityCutoff ? similarity : Double.NaN;
}
@Override
public double computeWeightedSimilarity(long[] vector1, long[] vector2, double[] weights1, double[] weights2) {
assert vector1.length == weights1.length;
assert vector2.length == weights2.length;
int offset1 = 0;
int offset2 = 0;
int length1 = weights1.length;
int length2 = weights2.length;
double max = 0;
double min = 0;
while (offset1 < length1 && offset2 < length2) {
long target1 = vector1[offset1];
long target2 = vector2[offset2];
if (target1 == target2) {
double w1 = weights1[offset1];
double w2 = weights2[offset2];
if (w1 > w2) {
max += w1;
min += w2;
} else {
min += w1;
max += w2;
}
offset1++;
offset2++;
} else if (target1 < target2) {
max += weights1[offset1];
offset1++;
} else {
max += weights2[offset2];
offset2++;
}
}
for (; offset1 < length1; offset1++) {
max += weights1[offset1];
}
for (; offset2 < length2; offset2++) {
max += weights2[offset2];
}
double similarity = min / max;
return similarity >= similarityCutoff ? similarity : Double.NaN;
}
static class Builder implements MetricSimilarityComputerBuilder {
public MetricSimilarityComputer build(double similarityCutoff) {
return new JaccardSimilarityComputer(similarityCutoff);
}
@Override
public String render() {
return "JACCARD";
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy