src.it.unimi.dsi.util.IntParallelCounterArray Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of dsiutils Show documentation
The DSI utilities are a mishmash of classes accumulated during the last twenty years in projects developed at the DSI (Dipartimento di Scienze dell'Informazione, i.e., Information Sciences Department), now DI (Dipartimento di Informatica, i.e., Informatics Department), of the Universita` degli Studi di Milano.
There is a newer version: 2.7.3
Show newest version
package it.unimi.dsi.util;

/*
 * DSI utilities
 *
 * Copyright (C) 2010-2020 Paolo Boldi and Sebastiano Vigna
 *
 *  This library is free software; you can redistribute it and/or modify it
 *  under the terms of the GNU Lesser General Public License as published by the Free
 *  Software Foundation; either version 3 of the License, or (at your option)
 *  any later version.
 *
 *  This library is distributed in the hope that it will be useful, but
 *  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
 *  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public License
 *  for more details.
 *
 *  You should have received a copy of the GNU Lesser General Public License
 *  along with this program; if not, see .
 *
 */

import it.unimi.dsi.Util;
import it.unimi.dsi.bits.Fast;
import it.unimi.dsi.bits.LongArrayBitVector;
import it.unimi.dsi.fastutil.longs.LongBigList;
import it.unimi.dsi.stat.Ziggurat;

import java.io.Serializable;

/**
 * An array of approximate sets each represented using a Parallel counter.
 *
 * Parallel counters represent the number of elements of a set in an approximate way. They have been
 * introduced by Philippe Flajolet, Éric Fusy, Olivier Gandouet, and Freédeéric Meunier in
 * “Parallel: the analysis of a near-optimal cardinality estimation algorithm”,
 * Proceedings of the 13th conference on analysis of algorithm (AofA 07), pages
 * 127−146, 2007. They are an improvement over the basic idea of loglog counting, introduced by
 * Marianne Durand and Philippe Flajolet in “Loglog counting of large cardinalities”,
 * ESA 2003, 11th Annual European Symposium, volume 2832 of Lecture Notes in Computer Science, pages 605−617, Springer, 2003.
 *
 * 
Each counter is composed by {@link #m} registers, and each register is made of {@link #registerSize} bits.
 * The first number depends on the desired relative standard deviation, and its logarithm can be computed using {@link #log2NumberOfRegisters(double)},
 * whereas the second number depends on an upper bound on the number of distinct elements to be counted, and it can be computed
 * using {@link #registerSize(long)}.
 *
 * 
Actually, this class implements an array of counters. Each counter is completely independent, but they all use the same hash function.
 * The reason for this design is that in our intended applications hundred of millions of counters are common, and the JVM overhead to create such a number of objects
 * would be unbearable. This class allocates an array of {@link LongArrayBitVector}s, each containing {@link #CHUNK_SIZE} registers,
 * and can thus handle billions of billions of registers efficiently (in turn, this means being able to
 * handle an array of millions of billions of high-precision counters).
 *
 * 
When creating an instance, you can choose the size of the array (i.e., the number of counters) and the desired relative standard deviation
 * (either {@linkplain #IntParallelCounterArray(int, long, int, double) explicitly} or
 * {@linkplain #IntParallelCounterArray(int, long, int, double) choosing the number of registers per counter}).
 * Then, you can {@linkplain #add(int, int) add an element to a counter}. At any time, you can
 * {@linkplain #count(int) count} count (approximately) the number of distinct elements that have been added to a counter.
 *
 * @author Paolo Boldi
 * @author Sebastiano Vigna
 */

public class IntParallelCounterArray implements Serializable {
	private static final long serialVersionUID = 1L;
	private static final boolean ASSERTS = false;
	private static final boolean DEBUG = false;

	public final static int MAX_EXPONENT = 2;

	/** The logarithm of the maximum size in registers of a bit vector. */
	public final static int CHUNK_SHIFT = 30;
	/** The maximum size in registers of a bit vector. */
	public final static long CHUNK_SIZE = 1L << CHUNK_SHIFT;
	public final static long CHUNK_MASK = CHUNK_SIZE - 1;

	/** A an array of bit vectors containing all registers. */
	protected final LongArrayBitVector bitVector[];

	/** {@link #registerSize}-bit views of {@link #bitVector}. */
	protected final LongBigList registers[];

	/** The number of registers. */
	protected final int m;

	/** The number of registers. */
	protected final int log2m;

	/** The number of registers minus one. */
	protected final int mMinus1;

	/** The size in bits of each register. */
	protected final int registerSize;

	/** The mask corresponding to a register. */
	protected final int registerMask;

	/** The shift that selects the chunk corresponding to a node. */
	protected final int nodeShift;

	private Ziggurat ziggurat;
	protected double base;
	private double logBase;
	private int maxExponent;

	/**
	 * Returns the logarithm of the number of registers per counter that are necessary to attain a
	 * given relative standard deviation.
	 *
	 * @param rsd the relative standard deviation to be attained.
	 * @return the logarithm of the number of registers that are necessary to attain relative standard deviation rsd.
	 */
	public static int log2NumberOfRegisters(final double rsd) {
		return (int)Math.ceil(Fast.log2((1 / rsd) * (1 / rsd)));
	}


	/**
	 * Returns the relative standard deviation corresponding to a given logarithm of the number of registers per counter.
	 *
	 * @param log2m the logarithm of the number of registers.
	 * @return the resulting relative standard deviation.
	 */
	public static double relativeStandardDeviation(final int log2m) {
		return 1 / Math.sqrt(1 << log2m);
	}

	/**
	 * Returns the register size in bits, given an upper bound on the number of distinct elements.
	 *
	 * @param n an upper bound on the number of distinct elements.
	 * @return the register size in bits.
	 */

	public static int registerSize(final long n) {
		return Math.max(4, (int)Math.ceil(Math.log(Math.log(n) / Math.log(2)) / Math.log(2)));
	}

	/**
	 * Creates a new array of counters.
	 *
	 * @param arraySize the number of counters.
	 * @param n the expected number of elements.
	 * @param rsd the relative standard deviation.
	 * @param floatingPointPrecision the precision used for floating-point computations.
	 */
	public IntParallelCounterArray(final int arraySize, final long n, final double rsd, final double floatingPointPrecision) {
		this(arraySize, n, log2NumberOfRegisters(rsd), floatingPointPrecision);
	}

	/**
	 * Creates a new array of counters.
	 *
	 * @param arraySize the number of counters.
	 * @param n the expected number of elements.
	 * @param log2m the logarithm of the number of registers per counter.
 	 * @param floatingPointPrecision the precision used for floating-point computations.
	 */
	public IntParallelCounterArray(final int arraySize, final long n, final int log2m, final double floatingPointPrecision) {
		this(arraySize, n, log2m, floatingPointPrecision, Util.randomSeed());
	}

	/**
	 * Creates a new array of counters.
	 *
	 * @param arraySize the number of counters.
	 * @param n the expected number of elements.
	 * @param log2m the logarithm of the number of registers per counter.
	 * @param floatingPointPrecision the precision used for floating-point computations.
	 * @param seed the seed used to compute the hash function
	 */
	public IntParallelCounterArray(final int arraySize, final long n, final int log2m, final double floatingPointPrecision, final long seed) {
		this.m = 1 << (this.log2m = log2m);
		this.mMinus1 = m - 1;
		this.registerSize = (int)(registerSize(n) + Math.ceil(-Fast.log2(floatingPointPrecision)));
		registerMask = (1 << registerSize) - 1;
		nodeShift = CHUNK_SHIFT - log2m;

		base = (1 + floatingPointPrecision) / (1 - floatingPointPrecision);
		logBase = Math.log(base);
		maxExponent = (int)Math.ceil(Math.log(2) / logBase);

		// System.err.println(arraySize + " " + m + " " + registerSize);
		final long sizeInRegisters = (long)arraySize * m;
		final int numVectors = (int)((sizeInRegisters + CHUNK_MASK) >>> CHUNK_SHIFT);

		bitVector = new LongArrayBitVector[numVectors];
		registers = new LongBigList[numVectors];
		for(int i = 0; i < numVectors; i++) {
			this.bitVector[i] = LongArrayBitVector.ofLength(registerSize * Math.min(CHUNK_SIZE, sizeInRegisters - ((long)i << CHUNK_SHIFT)));
			this.registers[i] = bitVector[i].asLongBigList(registerSize);
		}
		ziggurat = new Ziggurat(new XoRoShiRo128PlusRandom(seed));
		if (DEBUG) System.err.println("Register size: " + registerSize + " log2m (b): " + log2m + " m: " + m + " base: " + base);
	}


	private double[] maxz = new double[10000];
	private long[] maxe = new long[10000];

	/** Adds an element to a counter.
	 *
	 * @param k the index of the counter.
	 * @param v the element to be added.
	 */
	public void add(int k, int v) {
		final int registerSize = this.registerSize;
		// Chunk of the first register
		int chunk = (int)((long)k >>> nodeShift);
		// Offset in bits of the first register inside the chunk
		long offset = ((long)k << log2m & CHUNK_MASK) * registerSize;
		long[] bits = bitVector[chunk].bits();
		int length = bits.length;

		int word = (int)(offset / Long.SIZE) - 1;
		long curr = 0;
		// The number of bits still to be filled in curr.
		// TODO: This won't work unless offset is a multiple of Long.SIZE.
		int used = (int)(offset % Long.SIZE);

		long ee[];

		if (ASSERTS) ee = new long[m];

		for (int i = 0; i < m; i++) {
			double z = ziggurat.nextDouble();
			maxz[i] = Math.max(maxz[i], 1/z);
			final long e = Math.max(0, - Math.round(Math.log(z) / logBase) + maxExponent) & registerMask;
			maxe[i] = Math.max(maxe[i], e);
			//System.err.print(e + "\t");
			if (ASSERTS) ee[i] = e;
			if (ASSERTS) assert e < (1 << registerSize);
			if (ASSERTS) assert e >= 0;

			if (used < Long.SIZE - registerSize) {
				curr |= e << used;
				used += registerSize;
			}
			else {
				if (++word == length)  {
					word = 0;
					bits = bitVector[++chunk].bits();
					length = bits.length;
				}
				bits[word] = curr | e << used;
				curr = e >>> Long.SIZE - used;
				used += registerSize - Long.SIZE;
			}
		}

		//System.err.println();

		if (ASSERTS) {
			for (int j = 0; j < m; j++) {
				assert ee[j] == registers[(int)((((long)k << log2m) + j) >> CHUNK_SHIFT)].getLong((((long)k << log2m) + j) & CHUNK_MASK) : "[" + j + "] " + ee[j] + "!=" + registers[(int)((((long)k << log2m) + j) >> CHUNK_SHIFT)].getLong((((long)k << log2m) + j) & CHUNK_MASK);
			}
		}

	}

	public void printMins() {
		for(int i = 0; i < m; i++) System.out.print(maxe[i] + "\t");
		System.err.println();
		for(int i = 0; i < m; i++) System.out.print(1 / maxz[i] + "\t");
		System.err.println();
		for(int i = 0; i < m; i++) System.out.print(maxz[i] + "\t");
		System.err.println();
	}


	/** Returns the array of big lists of registers underlying this array of counters.
	 *
	 * The main purpose of this method is debugging, as it makes comparing
	 * the evolution of the state of two implementations easy.
	 *
	 * @return the array of big lists of registers underlying this array of counters.
	 */

	public LongBigList[] registers() {
		return registers;
		/* TODO: final LongBigList[] result = new LongBigList[registers.length];
		for(int i = result.length; i-- != 0;) result[i] = LongBigLists.unmodifiable(registers[i]);
		return result;*/
	}

	/** Estimates the number of distinct elements that have been added to a given counter so far.
	 *
	 * @param k the index of the counter.
	 * @return an approximation of the number of distinct elements that have been added to counter k so far.
	 */
	public double count(final int k) {
		double s = 0;

		final int registerSize = this.registerSize;
		// Chunk of the first register
		int chunk = (int)((long)k >>> nodeShift);
		// Offset in bits of the first register inside the chunk
		long offset = ((long)k << log2m & CHUNK_MASK) * registerSize;
		long[] bits = bitVector[chunk].bits();
		int length = bits.length;

		int word = (int)(offset / Long.SIZE);
		long curr = bits[word] >>> offset % Long.SIZE;
		long r;
		int remaining = (int)(Long.SIZE - offset % Long.SIZE), mask = (1 << registerSize) - 1;

		for (int j = 0; j < m; j++) {
			if (remaining >= registerSize) {
				r = curr & mask;
				curr >>>= registerSize;
				remaining -= registerSize;
			}
			else {
				if (++word == length)  {
					word = 0;
					bits = bitVector[++chunk].bits();
					length = bits.length;
				}
				r = (curr | bits[word] << remaining) & mask;
				curr = bits[word] >>> registerSize - remaining;
				remaining += Long.SIZE - registerSize;
			}

			if (ASSERTS) assert r == registers[(int)((((long)k << log2m) + j) >> CHUNK_SHIFT)].getLong((((long)k << log2m) + j) & CHUNK_MASK) : "[" + j + "] " + r + "!=" + registers[(int)((((long)k << log2m) + j) >> CHUNK_SHIFT)].getLong((((long)k << log2m) + j) & CHUNK_MASK);

			s += Math.pow(base, -r + maxExponent);
		}

		return m / s;
	}
}