All Downloads are FREE. Search and download functionalities are using the official Maven repository.

apoc.stats.DegreeDistribution Maven / Gradle / Ivy

There is a newer version: 5.25.1
Show newest version
/*
 * Copyright (c) "Neo4j"
 * Neo4j Sweden AB [http://neo4j.com]
 *
 * This file is part of Neo4j.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package apoc.stats;

import static org.neo4j.token.api.TokenConstants.ANY_LABEL;
import static org.neo4j.token.api.TokenConstants.ANY_RELATIONSHIP_TYPE;

import apoc.Pools;
import apoc.path.RelationshipTypeAndDirections;
import apoc.util.kernel.MultiThreadedGlobalGraphOperations;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;
import java.util.stream.Stream;
import org.HdrHistogram.AtomicHistogram;
import org.apache.commons.lang3.tuple.Pair;
import org.neo4j.graphdb.Direction;
import org.neo4j.graphdb.RelationshipType;
import org.neo4j.internal.kernel.api.NodeCursor;
import org.neo4j.internal.kernel.api.Read;
import org.neo4j.internal.kernel.api.TokenRead;
import org.neo4j.kernel.api.KernelTransaction;
import org.neo4j.kernel.internal.GraphDatabaseAPI;
import org.neo4j.procedure.Context;
import org.neo4j.procedure.Description;
import org.neo4j.procedure.Name;
import org.neo4j.procedure.NotThreadSafe;
import org.neo4j.procedure.Procedure;
import org.neo4j.token.api.NamedToken;

/**
 * @author mh
 * @since 07.08.17
 */
public class DegreeDistribution {

    private static final int BATCHSIZE = 10_000;

    public static class DegreeStats {
        public final String typeName;
        public final long total;
        private final int type;
        private final Direction direction;
        private transient AtomicHistogram histogram;

        public void computeDegree(NodeCursor nodeCursor) {
            int degree = DegreeUtil.degree(nodeCursor, type, direction);
            record(degree);
        }

        public static class Result {
            @Description("The type of the relationship.")
            public String type;

            @Description("The direction of the relationship.")
            public String direction;

            @Description("The total observed relationships.")
            public long total;

            @Description("The 50th percentile grouping.")
            public long p50;

            @Description("The 75th percentile grouping.")
            public long p75;

            @Description("The 90th percentile grouping.")
            public long p90;

            @Description("The 95th percentile grouping.")
            public long p95;

            @Description("The 99th percentile grouping.")
            public long p99;

            @Description("The 99.9th percentile grouping.")
            public long p999;

            @Description("The max value.")
            public long max;

            @Description("The min value.")
            public long min;

            @Description("The mean value.")
            public double mean;
        }

        public DegreeStats(String typeName, int type, Direction direction, long total) {
            this.typeName = typeName;
            this.type = type;
            this.direction = direction;
            this.total = total;
            this.histogram = new AtomicHistogram(total, 3);
        }

        public void record(long value) {
            histogram.recordValue(value);
        }

        public Result done() {
            Result result = new Result();
            result.type = typeName;
            result.direction = direction.name();
            result.total = total;
            result.max = histogram.getMaxValue();
            result.min = histogram.getMinValue();
            result.mean = histogram.getMean();
            result.p50 = histogram.getValueAtPercentile(50);
            result.p75 = histogram.getValueAtPercentile(75);
            result.p90 = histogram.getValueAtPercentile(90);
            result.p95 = histogram.getValueAtPercentile(95);
            result.p99 = histogram.getValueAtPercentile(99);
            result.p999 = histogram.getValueAtPercentile(99.9);
            this.histogram.reset();
            this.histogram = null;
            return result;
        }
    }

    @Context
    public GraphDatabaseAPI db;

    @Context
    public KernelTransaction tx;

    @Context
    public Pools pools;

    @NotThreadSafe
    @Procedure("apoc.stats.degrees")
    @Description(
            "Returns the percentile groupings of the degrees on the `NODE` values connected by the given `RELATIONSHIP` types.")
    public Stream degrees(
            @Name(
                            value = "relTypes",
                            defaultValue = "",
                            description =
                                    "The relationship types to calculate the percentile grouping over. If this is empty or omitted, all relationships are used.")
                    String types) {
        List stats = prepareStats(types);

        MultiThreadedGlobalGraphOperations.forAllNodes(
                db,
                pools.getDefaultExecutorService(),
                BATCHSIZE,
                nodeCursor -> stats.forEach((s) -> s.computeDegree(nodeCursor)));
        return stats.stream().map(DegreeStats::done);
    }

    public List prepareStats(String types) {
        List stats = new ArrayList<>();
        TokenRead tokenRead = tx.tokenRead();
        Read read = tx.dataRead();
        if ("*".equals(types)) {
            Iterator tokens = tokenRead.relationshipTypesGetAllTokens();
            while (tokens.hasNext()) {
                NamedToken token = tokens.next();
                long total = read.countsForRelationship(ANY_LABEL, token.id(), ANY_LABEL);
                stats.add(new DegreeStats(token.name(), token.id(), Direction.OUTGOING, total));
                stats.add(new DegreeStats(token.name(), token.id(), Direction.INCOMING, total));
            }
            return stats;
        }
        List> pairs = RelationshipTypeAndDirections.parse(types);
        for (Pair pair : pairs) {
            String typeName = pair.getLeft() == null ? null : pair.getLeft().name();
            int type = typeName == null ? ANY_RELATIONSHIP_TYPE : tokenRead.relationshipType(typeName);
            long total = read.countsForRelationship(ANY_LABEL, type, ANY_LABEL);
            stats.add(new DegreeStats(typeName, type, pair.getRight(), total));
        }
        return stats;
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy