test.it.unimi.dsi.util.HyperLogLogCounterArrayTest Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of dsiutils Show documentation
Show all versions of dsiutils Show documentation
The DSI utilities are a mishmash of classes accumulated during the last twenty years in projects developed at the DSI (Dipartimento di Scienze dell'Informazione, i.e., Information Sciences Department), now DI (Dipartimento di Informatica, i.e., Informatics Department), of the Università degli Studi di Milano.
package it.unimi.dsi.util;
/*
* DSI utilities
*
* Copyright (C) 2010-2020 Paolo Boldi and Sebastiano Vigna
*
* This library is free software; you can redistribute it and/or modify it
* under the terms of the GNU Lesser General Public License as published by the Free
* Software Foundation; either version 3 of the License, or (at your option)
* any later version.
*
* This library is distributed in the hope that it will be useful, but
* WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
* or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License
* for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this program; if not, see <http://www.gnu.org/licenses/>.
*
*/
import static org.junit.Assert.assertTrue;
import org.junit.Ignore;
import org.junit.Test;
import it.unimi.dsi.logging.ProgressLogger;
/**
 * Statistical tests for {@code HyperLogLogCounterArray}.
 *
 * <p>Each test adds a known number of distinct values to one or more counters, repeats the
 * experiment with a different seed per trial, and requires that a minimum number of trials
 * produce an estimate whose relative error is below twice the value returned by
 * {@code HyperLogLogCounterArray.relativeStandardDeviation(log2m)}.
 */
public class HyperLogLogCounterArrayTest {

	/**
	 * Checks whether an estimate is close enough to the true number of distinct values.
	 *
	 * @param expected the true number of distinct values that were added (must be positive).
	 * @param estimate the value returned by the counter.
	 * @param rsd the relative standard deviation for the counter configuration.
	 * @return true if the relative error of {@code estimate} is strictly smaller than {@code 2 * rsd}.
	 */
	private static boolean isWithinTolerance(final double expected, final double estimate, final double rsd) {
		return Math.abs(expected - estimate) / expected < 2 * rsd;
	}

	/**
	 * Runs one group of trials of {@link #testExtreme()} for each tested value of {@code log2m}.
	 *
	 * <p>Every trial adds to a single counter all {@code int} values in
	 * [{@code Integer.MIN_VALUE}, {@code Integer.MAX_VALUE}) that are not multiples of
	 * {@code modulus}, and then compares the estimate with {@code distinct}.
	 *
	 * @param pl the progress logger used to time each trial.
	 * @param capacity the second constructor argument of the counter array
	 * (presumably the expected number of elements; confirm against {@code HyperLogLogCounterArray}).
	 * @param distinct the number of distinct values added by a trial.
	 * @param modulus values that are multiples of this number are skipped.
	 * @param numTrials the number of trials (the trial index is also used as the seed argument).
	 * @param mustBeCorrect the minimum number of trials that must be within tolerance.
	 */
	private static void checkExtreme(final ProgressLogger pl, final long capacity, final long distinct, final int modulus, final int numTrials, final int mustBeCorrect) {
		for (final int log2m : new int[] { 6, 8, 12 }) {
			final double rsd = HyperLogLogCounterArray.relativeStandardDeviation(log2m);
			int correct = 0;
			for (int trial = 0; trial < numTrials; trial++) {
				final HyperLogLogCounterArray a = new HyperLogLogCounterArray(1, capacity, log2m, trial);
				pl.start();
				// Integer.MAX_VALUE itself is never visited, so one value fewer than
				// "distinct" is actually added; this is negligible at this scale.
				for (int i = Integer.MIN_VALUE; i < Integer.MAX_VALUE; i++) {
					if (i % modulus != 0) a.add(0, i);
				}
				pl.stop();
				pl.count = distinct;
				if (isWithinTolerance(distinct, a.count(0), rsd)) correct++;
			}
			// The number of good trials, not the threshold, is what must be checked.
			assertTrue(correct + " < " + mustBeCorrect, correct >= mustBeCorrect);
		}
	}

	/**
	 * Tests a single counter on {@code size} distinct {@code int} values spread evenly
	 * over the whole {@code int} range, requiring at least 9 good trials out of 10.
	 */
	@Test
	public void testSingle() {
		final int numTrials = 10;
		for (final int size : new int[] { 1, 10, 100, 1000, 100000 }) {
			for (final int log2m : new int[] { 6, 8, 12 }) {
				final double rsd = HyperLogLogCounterArray.relativeStandardDeviation(log2m);
				int correct = 0;
				for (int trial = 0; trial < numTrials; trial++) {
					final HyperLogLogCounterArray a = new HyperLogLogCounterArray(1, size, log2m, trial);
					// For size 1 the cast truncates 2^32 to 0, which is harmless
					// because a single value is added.
					final int incr = (int)((1L << 32) / size);
					int x = Integer.MIN_VALUE;
					for (int i = 0; i < size; i++) {
						a.add(0, x);
						x += incr;
					}
					if (isWithinTolerance(size, a.count(0), rsd)) correct++;
				}
				assertTrue(correct + " < " + 9, correct >= 9);
			}
		}
	}

	/**
	 * Same as {@link #testSingle()}, but adds every value to the counters of index 0 and 1
	 * of the same array and checks the two estimates independently.
	 */
	@Test
	public void testDouble() {
		final int numTrials = 10;
		for (final int size : new int[] { 1, 10, 100, 1000, 100000 }) {
			for (final int log2m : new int[] { 4, 6, 8, 12 }) {
				final double rsd = HyperLogLogCounterArray.relativeStandardDeviation(log2m);
				int correct0 = 0, correct1 = 0;
				for (int trial = 0; trial < numTrials; trial++) {
					final HyperLogLogCounterArray a = new HyperLogLogCounterArray(2, size, log2m, trial);
					final int incr = (int)((1L << 32) / size);
					int x = Integer.MIN_VALUE;
					for (int i = 0; i < size; i++) {
						a.add(0, x);
						a.add(1, x);
						x += incr;
					}
					if (isWithinTolerance(size, a.count(0), rsd)) correct0++;
					if (isWithinTolerance(size, a.count(1), rsd)) correct1++;
				}
				assertTrue(correct0 + " < " + 9, correct0 >= 9);
				assertTrue(correct1 + " < " + 9, correct1 >= 9);
			}
		}
	}

	/**
	 * Tests a single counter on one and four billion distinct {@code long} values,
	 * generated by repeatedly adding {@code 2^60 / size} starting from {@code Long.MIN_VALUE}.
	 */
	@Ignore("too slow")
	@Test
	public void testLarge() {
		final int numTrials = 10;
		for (final long size : new long[] { 1000000000, 4000000000L }) {
			for (final int log2m : new int[] { 6, 8, 12 }) {
				final double rsd = HyperLogLogCounterArray.relativeStandardDeviation(log2m);
				int correct = 0;
				for (int trial = 0; trial < numTrials; trial++) {
					final HyperLogLogCounterArray a = new HyperLogLogCounterArray(1, size, log2m, trial);
					final long incr = (1L << 60) / size;
					long x = Long.MIN_VALUE;
					for (long i = size; i-- != 0;) {
						a.add(0, x);
						x += incr;
					}
					if (isWithinTolerance(size, a.count(0), rsd)) correct++;
				}
				assertTrue(correct + " < " + 9, correct >= 9);
			}
		}
	}

	/**
	 * Tests a single counter on billions of distinct {@code int} values, requiring
	 * at least 18 good trials out of 20 for each configuration.
	 */
	@Ignore("too slow")
	@Test
	public void testExtreme() {
		final int numTrials = 20, mustBeCorrect = 18;
		final ProgressLogger pl = new ProgressLogger();

		// All ints that are not multiples of 4: 3 * 2^30 values.
		final long threeQuarters = 3L * 1024 * 1024 * 1024;
		checkExtreme(pl, threeQuarters, threeQuarters, 4, numTrials, mustBeCorrect);

		// All ints that are not multiples of 8: 7 * 2^29 values.
		final long sevenEighths = 7L * 512 * 1024 * 1024;
		checkExtreme(pl, sevenEighths, sevenEighths, 8, numTrials, mustBeCorrect);

		// Same values as above, but with 2^33 as the constructor argument. The estimate
		// is compared with the number of values actually added, as 2^33 distinct ints
		// do not exist.
		// NOTE(review): the original compared the estimate with 2^33 behind an assertion
		// that could never fail; confirm that an oversized constructor argument is the
		// intended scenario here.
		checkExtreme(pl, 8L * 1024 * 1024 * 1024, sevenEighths, 8, numTrials, mustBeCorrect);
	}

	/** Runs {@link #testExtreme()} directly, bypassing the {@code @Ignore} annotation. */
	public static void main(final String arg[]) {
		new HyperLogLogCounterArrayTest().testExtreme();
	}
}