org.apache.datasketches.tuple.ArrayOfDoublesUpdatableSketchBuilder Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of datasketches-java Show documentation
Show all versions of datasketches-java Show documentation
Core sketch algorithms used alone and by other Java repositories in the DataSketches library.
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.datasketches.tuple;
import static org.apache.datasketches.Util.DEFAULT_NOMINAL_ENTRIES;
import static org.apache.datasketches.Util.DEFAULT_UPDATE_SEED;
import static org.apache.datasketches.Util.checkNomLongs;
import org.apache.datasketches.ResizeFactor;
import org.apache.datasketches.SketchesArgumentException;
import org.apache.datasketches.memory.WritableMemory;
/**
* For building a new ArrayOfDoublesUpdatableSketch
*/
public class ArrayOfDoublesUpdatableSketchBuilder {
private int nomEntries_;
private ResizeFactor resizeFactor_;
private int numValues_;
private float samplingProbability_;
private long seed_;
private static final int DEFAULT_NUMBER_OF_VALUES = 1;
private static final float DEFAULT_SAMPLING_PROBABILITY = 1;
private static final ResizeFactor DEFAULT_RESIZE_FACTOR = ResizeFactor.X8;
/**
* Creates an instance of builder with default parameters
*/
public ArrayOfDoublesUpdatableSketchBuilder() {
nomEntries_ = DEFAULT_NOMINAL_ENTRIES;
resizeFactor_ = DEFAULT_RESIZE_FACTOR;
numValues_ = DEFAULT_NUMBER_OF_VALUES;
samplingProbability_ = DEFAULT_SAMPLING_PROBABILITY;
seed_ = DEFAULT_UPDATE_SEED;
}
/**
* This is to set the nominal number of entries.
* @param nomEntries Nominal number of entries. Forced to the nearest power of 2 greater than
* or equal to given value.
* @return this builder
*/
public ArrayOfDoublesUpdatableSketchBuilder setNominalEntries(final int nomEntries) {
nomEntries_ = 1 << checkNomLongs(nomEntries);
return this;
}
/**
* This is to set the resize factor.
* Value of X1 means that the maximum capacity is allocated from the start.
* Default resize factor is X8.
* @param resizeFactor value of X1, X2, X4 or X8
* @return this UpdatableSketchBuilder
*/
public ArrayOfDoublesUpdatableSketchBuilder setResizeFactor(final ResizeFactor resizeFactor) {
resizeFactor_ = resizeFactor;
return this;
}
/**
* This is to set sampling probability.
* Default probability is 1.
* @param samplingProbability sampling probability from 0 to 1
* @return this builder
*/
public ArrayOfDoublesUpdatableSketchBuilder
setSamplingProbability(final float samplingProbability) {
if ((samplingProbability < 0) || (samplingProbability > 1f)) {
throw new SketchesArgumentException("sampling probability must be between 0 and 1");
}
samplingProbability_ = samplingProbability;
return this;
}
/**
* This is to set the number of double values associated with each key
* @param numValues number of double values
* @return this builder
*/
public ArrayOfDoublesUpdatableSketchBuilder setNumberOfValues(final int numValues) {
numValues_ = numValues;
return this;
}
/**
* Sets the long seed value that is required by the hashing function.
* @param seed See seed
* @return this builder
*/
public ArrayOfDoublesUpdatableSketchBuilder setSeed(final long seed) {
seed_ = seed;
return this;
}
/**
* Returns an ArrayOfDoublesUpdatableSketch with the current configuration of this Builder.
* @return an ArrayOfDoublesUpdatableSketch
*/
public ArrayOfDoublesUpdatableSketch build() {
return new HeapArrayOfDoublesQuickSelectSketch(nomEntries_, resizeFactor_.lg(),
samplingProbability_, numValues_, seed_);
}
/**
* Returns an ArrayOfDoublesUpdatableSketch with the current configuration of this Builder.
* @param dstMem instance of Memory to be used by the sketch
* @return an ArrayOfDoublesUpdatableSketch
*/
public ArrayOfDoublesUpdatableSketch build(final WritableMemory dstMem) {
return new DirectArrayOfDoublesQuickSelectSketch(nomEntries_, resizeFactor_.lg(),
samplingProbability_, numValues_, seed_, dstMem);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy