All downloads are free. Search and download functionality uses the official Maven repository.

org.elasticsearch.search.aggregations.bucket.BucketUtils Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to Elasticsearch under one or more contributor
 * license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright
 * ownership. Elasticsearch licenses this file to you under
 * the Apache License, Version 2.0 (the "License"); you may
 * not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package org.elasticsearch.search.aggregations.bucket;

/**
 * Static utilities shared by bucketing aggregations.
 */
public class BucketUtils {

    /** Upper bound on the per-shard multiplier, to avoid excessive data transfer. */
    private static final int MAX_SHARD_MULTIPLIER = 10;

    /** Smallest queue size ever suggested when more than one shard is queried. */
    private static final int MIN_SHARD_QUEUE_SIZE = 10;

    /**
     * Suggests a default size for the shard-side PriorityQueues used when the
     * top N terms are selected from a distributed index.
     * <p>
     * For a single shard the requested size is returned unchanged. Otherwise
     * the requested size is multiplied by the number of shards (capped at 10),
     * and the product is clamped to the range {@code [10, Integer.MAX_VALUE]}.
     *
     * @param finalSize
     *            The number of terms required in the final reduce phase.
     * @param numberOfShards
     *            The number of shards being queried; asserted to be at least 1.
     * @return A suggested default for the size of any shard-side PriorityQueues
     */
    public static int suggestShardSideQueueSize(int finalSize, int numberOfShards) {
        assert numberOfShards >= 1;
        if (numberOfShards != 1) {
            // The shard multiplier is capped so that a large number of shards
            // does not inflate the amount of data each shard sends back.
            final int multiplier = numberOfShards < MAX_SHARD_MULTIPLIER ? numberOfShards : MAX_SHARD_MULTIPLIER;
            // Widen to long before multiplying so the product cannot overflow.
            final long scaledSize = multiplier * (long) finalSize;
            if (scaledSize < MIN_SHARD_QUEUE_SIZE) {
                // A very small finalSize (e.g. 1) combined with few shards would
                // give too small a sample; gather a reasonable number of entries
                // from each shard (at low cost) to improve the accuracy of the
                // final result.
                return MIN_SHARD_QUEUE_SIZE;
            }
            if (scaledSize > Integer.MAX_VALUE) {
                return Integer.MAX_VALUE;
            }
            return (int) scaledSize;
        }
        // Only one shard: its queue needs exactly as many entries as the final result.
        return finalSize;
    }

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy