// com.datastax.driver.core.policies.LatencyAwarePolicy
/*
* Copyright DataStax, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.datastax.driver.core.policies;
import com.codahale.metrics.Gauge;
import com.datastax.driver.core.Cluster;
import com.datastax.driver.core.Host;
import com.datastax.driver.core.HostDistance;
import com.datastax.driver.core.LatencyTracker;
import com.datastax.driver.core.Metrics;
import com.datastax.driver.core.MetricsUtil;
import com.datastax.driver.core.Statement;
import com.datastax.driver.core.exceptions.BootstrappingException;
import com.datastax.driver.core.exceptions.DriverException;
import com.datastax.driver.core.exceptions.OverloadedException;
import com.datastax.driver.core.exceptions.QueryValidationException;
import com.datastax.driver.core.exceptions.UnavailableException;
import com.datastax.driver.core.exceptions.UnpreparedException;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.collect.AbstractIterator;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import com.google.common.util.concurrent.ThreadFactoryBuilder;
import java.util.ArrayDeque;
import java.util.Collection;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Iterator;
import java.util.Map;
import java.util.Queue;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentMap;
import java.util.concurrent.Executors;
import java.util.concurrent.ScheduledExecutorService;
import java.util.concurrent.ThreadFactory;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicReference;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
* A wrapper load balancing policy that adds latency awareness to a child policy.
*
* When used, this policy will collect the latencies of the queries to each Cassandra node and
* maintain a per-node average latency score. The nodes that are slower than the best performing
* node by more than a configurable threshold will be moved to the end of the query plan (that is,
* they will only be tried if all other nodes failed). Note that this policy only penalizes slow
* nodes, it does not globally sort the query plan by latency.
*
 * <p>The latency score for a given node is based on a form of exponential moving
* average. In other words, the latency score of a node is the average of its previously
* measured latencies, but where older measurements gets an exponentially decreasing weight. The
* exact weight applied to a newly received latency is based on the time elapsed since the previous
* measure (to account for the fact that latencies are not necessarily reported with equal
* regularity, neither over time nor between different nodes).
*
 * <p>Once a node is excluded from query plans (because its averaged latency grew over the exclusion
* threshold), its latency score will not be updated anymore (since it is not queried). To give a
* chance to this node to recover, the policy has a configurable retry period. The policy will not
* penalize a host for which no measurement has been collected for more than this retry period.
*
 * <p>Please see the {@link Builder} class and methods for more details on the possible parameters
* of this policy.
*
* @since 1.0.4
*/
public class LatencyAwarePolicy implements ChainableLoadBalancingPolicy {
// Shared logger for the policy and its nested helper classes.
private static final Logger logger = LoggerFactory.getLogger(LatencyAwarePolicy.class);
// Opt-in JVM system property enabling per-host counters/gauges in the metrics registry.
private static final boolean HOST_METRICS_ENABLED =
Boolean.getBoolean("com.datastax.driver.HOST_METRICS_ENABLED");
// The wrapped policy that produces the base query plans and host distances.
private final LoadBalancingPolicy childPolicy;
// Collects per-host latency measurements and caches the minimum average latency.
private final Tracker latencyTracker;
// Single-threaded scheduler that periodically refreshes the cached minimum (see Updater).
private final ScheduledExecutorService updaterService =
Executors.newSingleThreadScheduledExecutor(threadFactory("LatencyAwarePolicy updater"));
// Hosts slower than (exclusionThreshold * fastest host average) are pushed to the end of plans.
private final double exclusionThreshold;
// Decay scale (nanoseconds) of the exponential moving average of latencies.
private final long scale;
// How long (nanoseconds) a host may stay penalized before being reconsidered.
private final long retryPeriod;
// Minimum number of measurements before a host's score is considered meaningful.
private final long minMeasure;
// Driver metrics registry; assigned in init(), may be null if metrics are disabled.
private volatile Metrics metrics;
/**
 * Builds the policy from the values gathered by {@link Builder}, and schedules the periodic
 * task that recomputes the cached minimum average latency.
 */
private LatencyAwarePolicy(
LoadBalancingPolicy childPolicy,
double exclusionThreshold,
long scale,
long retryPeriod,
long updateRate,
int minMeasure) {
this.childPolicy = childPolicy;
this.retryPeriod = retryPeriod;
this.scale = scale;
this.latencyTracker = new Tracker();
this.exclusionThreshold = exclusionThreshold;
this.minMeasure = minMeasure;
// The minimum is recomputed at a fixed rate rather than on every query because it requires a
// full scan of the per-host trackers; see Builder#withUpdateRate.
updaterService.scheduleAtFixedRate(new Updater(), updateRate, updateRate, TimeUnit.NANOSECONDS);
}
/** Returns the child policy that this latency-aware policy wraps. */
@Override
public LoadBalancingPolicy getChildPolicy() {
return childPolicy;
}
/**
 * Creates a new latency aware policy builder given the child policy that the resulting policy
 * should wrap (shorthand for {@code new Builder(childPolicy)}).
 *
 * @param childPolicy the load balancing policy to wrap with latency awareness.
 * @return the created builder.
 */
public static Builder builder(LoadBalancingPolicy childPolicy) {
return new Builder(childPolicy);
}
@VisibleForTesting
class Updater implements Runnable {

  // Hosts that were over the exclusion threshold at the previous tick; kept only so that state
  // transitions (newly excluded / reconsidered) are logged once instead of on every tick.
  private Set<Host> excludedAtLastTick = Collections.emptySet();

  @Override
  public void run() {
    try {
      logger.trace("Updating LatencyAwarePolicy minimum");
      latencyTracker.updateMin();
      if (logger.isDebugEnabled()) {
        /*
         * For users to be able to know if the policy potentially needs tuning, we need to provide
         * some feedback on how things evolve. For that, we use the min computation to also check
         * which host would be excluded if a query were submitted now and, if any host is, we log
         * it (but we try to avoid flooding too). This is probably interesting information anyway
         * since it gives an idea of which hosts perform badly.
         */
        Set<Host> excludedThisTick = new HashSet<Host>();
        double currentMin = latencyTracker.getMinAverage();
        for (Map.Entry<Host, Snapshot.Stats> entry :
            getScoresSnapshot().getAllStats().entrySet()) {
          Host host = entry.getKey();
          Snapshot.Stats stats = entry.getValue();
          // Not enough data points yet: the host is never penalized, nothing to report.
          if (stats.getMeasurementsCount() < minMeasure) continue;
          // Score is stale (no measurement within the retry period): the host gets a new chance
          // and is not counted as excluded for this tick.
          if (stats.lastUpdatedSince() > retryPeriod) {
            if (excludedAtLastTick.contains(host))
              logger.debug(
                  String.format(
                      "Previously avoided host %s has not been queried since %.3fms: will be reconsidered.",
                      host, inMS(stats.lastUpdatedSince())));
            continue;
          }
          if (stats.getLatencyScore() > ((long) (exclusionThreshold * currentMin))) {
            excludedThisTick.add(host);
            if (!excludedAtLastTick.contains(host))
              logger.debug(
                  String.format(
                      "Host %s has an average latency score of %.3fms, more than %f times more than the minimum %.3fms: will be avoided temporarily.",
                      host, inMS(stats.getLatencyScore()), exclusionThreshold, inMS(currentMin)));
            continue;
          }
          if (excludedAtLastTick.contains(host)) {
            logger.debug(
                "Previously avoided host {} average latency has come back within accepted bounds: will be reconsidered.",
                host);
          }
        }
        excludedAtLastTick = excludedThisTick;
      }
    } catch (RuntimeException e) {
      // An unexpected exception would suppress further executions of the scheduled task, so
      // catch, log, but swallow after that.
      logger.error("Error while updating LatencyAwarePolicy minimum", e);
    }
  }
}
/** Converts a duration in nanoseconds to fractional milliseconds. */
private static double inMS(long nanos) {
  return nanos / 1000000.0;
}
/** Converts a (fractional) duration in nanoseconds to fractional milliseconds. */
private static double inMS(double nanos) {
  return nanos / 1000000.0;
}
/** Builds a thread factory whose threads are named with the given format. */
private static ThreadFactory threadFactory(String nameFormat) {
  ThreadFactoryBuilder builder = new ThreadFactoryBuilder();
  return builder.setNameFormat(nameFormat).build();
}
/**
 * Initializes the child policy, starts tracking latencies for the given hosts, and registers
 * the cached-minimum gauge with the driver metrics (when metrics are enabled).
 */
@Override
public void init(Cluster cluster, Collection<Host> hosts) {
  childPolicy.init(cluster, hosts);
  // Track all hosts known at init time; later hosts are added via onUp()/onAdd().
  for (Host host : hosts) {
    latencyTracker.addHost(host);
  }
  cluster.register(latencyTracker);
  metrics = cluster.getMetrics();
  if (metrics != null) {
    // Exposes the cached minimum average latency in nanoseconds (-1 until first computed).
    metrics
        .getRegistry()
        .register(
            "LatencyAwarePolicy.latencies.min",
            new Gauge<Long>() {
              @Override
              public Long getValue() {
                return latencyTracker.getMinAverage();
              }
            });
  }
}
/**
 * Returns the HostDistance for the provided host.
 *
 * @param host the host of which to return the distance of.
 * @return the HostDistance to {@code host} as returned by the wrapped policy.
 */
@Override
public HostDistance distance(Host host) {
// Latency awareness does not influence distances: delegate entirely to the child policy.
return childPolicy.distance(host);
}
/**
 * Returns the hosts to use for a new query.
 *
 * <p>The returned plan will be the same as the plan generated by the child policy, except that
 * nodes that are slower than the best performing node by more than a configurable threshold will
 * be moved to the end (that is, they will only be tried if all other nodes failed). Note that
 * this policy only penalizes slow nodes, it does not globally sort the query plan by latency.
 *
 * @param loggedKeyspace the currently logged keyspace.
 * @param statement the statement for which to build the plan.
 * @return the new query plan.
 */
@Override
public Iterator<Host> newQueryPlan(String loggedKeyspace, Statement statement) {
  final Iterator<Host> childIter = childPolicy.newQueryPlan(loggedKeyspace, statement);
  return new AbstractIterator<Host>() {

    // Hosts deemed too slow, kept aside and only replayed once the child plan is exhausted.
    private Queue<Host> skipped;

    @Override
    protected Host computeNext() {
      long min = latencyTracker.getMinAverage();
      long now = System.nanoTime();
      while (childIter.hasNext()) {
        Host host = childIter.next();
        TimestampedAverage latency = latencyTracker.latencyOf(host);
        // If we haven't had enough data points yet to have a score, or the last update of the
        // score is just too old, include the host.
        if (min < 0
            || latency == null
            || latency.nbMeasure < minMeasure
            || (now - latency.timestamp) > retryPeriod) {
          if (hostMetricsEnabled()) {
            metrics
                .getRegistry()
                .counter(
                    MetricsUtil.hostMetricName("LatencyAwarePolicy.inclusions-nodata.", host))
                .inc();
          }
          return host;
        }
        // If the host latency is within acceptable bounds of the fastest known host, return
        // that host. Otherwise, skip it.
        if (latency.average <= ((long) (exclusionThreshold * (double) min))) {
          if (hostMetricsEnabled()) {
            metrics
                .getRegistry()
                .counter(MetricsUtil.hostMetricName("LatencyAwarePolicy.inclusions.", host))
                .inc();
          }
          return host;
        }
        if (skipped == null) skipped = new ArrayDeque<Host>();
        skipped.offer(host);
        if (hostMetricsEnabled()) {
          metrics
              .getRegistry()
              .counter(MetricsUtil.hostMetricName("LatencyAwarePolicy.exclusions.", host))
              .inc();
        }
      }
      // Child plan exhausted: fall back to the skipped hosts, in the order they were skipped.
      if (skipped != null && !skipped.isEmpty()) {
        Host host = skipped.poll();
        if (hostMetricsEnabled()) {
          metrics
              .getRegistry()
              .counter(
                  MetricsUtil.hostMetricName("LatencyAwarePolicy.hits-while-excluded.", host))
              .inc();
        }
        return host;
      }
      return endOfData();
    }
  };
}
/**
 * Returns a snapshot of the scores (latency averages) maintained by this policy.
 *
 * @return a new (immutable) {@link Snapshot} object containing the current latency scores
 *     maintained by this policy.
 */
public Snapshot getScoresSnapshot() {
  Map<Host, TimestampedAverage> currentLatencies = latencyTracker.currentLatencies();
  ImmutableMap.Builder<Host, Snapshot.Stats> builder = ImmutableMap.builder();
  // A single timestamp is used so that all lastUpdatedSince values share the same reference.
  long now = System.nanoTime();
  for (Map.Entry<Host, TimestampedAverage> entry : currentLatencies.entrySet()) {
    Host host = entry.getKey();
    TimestampedAverage latency = entry.getValue();
    Snapshot.Stats stats =
        new Snapshot.Stats(now - latency.timestamp, latency.average, latency.nbMeasure);
    builder.put(host, stats);
  }
  return new Snapshot(builder.build());
}
/** Notifies the child policy and starts tracking latencies for the host that came back up. */
@Override
public void onUp(Host host) {
childPolicy.onUp(host);
latencyTracker.addHost(host);
}
/** Notifies the child policy and drops the latency history of the host that went down. */
@Override
public void onDown(Host host) {
childPolicy.onDown(host);
latencyTracker.resetHost(host);
}
/** Notifies the child policy and starts tracking latencies for the newly added host. */
@Override
public void onAdd(Host host) {
childPolicy.onAdd(host);
latencyTracker.addHost(host);
}
/** Notifies the child policy and drops the latency history of the removed host. */
@Override
public void onRemove(Host host) {
childPolicy.onRemove(host);
latencyTracker.resetHost(host);
}
/**
 * An immutable snapshot of the per-host scores (and stats in general) maintained by {@code
 * LatencyAwarePolicy} to base its decision upon.
 */
public static class Snapshot {

  // Immutable map built by LatencyAwarePolicy#getScoresSnapshot.
  private final Map<Host, Stats> stats;

  private Snapshot(Map<Host, Stats> stats) {
    this.stats = stats;
  }

  /**
   * A map with the stats for all hosts tracked by the {@code LatencyAwarePolicy} at the time of
   * the snapshot.
   *
   * @return an immutable map with all the stats contained in this snapshot.
   */
  public Map<Host, Stats> getAllStats() {
    return stats;
  }

  /**
   * The {@code Stats} object for a given host.
   *
   * @param host the host to return the stats of.
   * @return the {@code Stats} for {@code host} in this snapshot or {@code null} if the snapshot
   *     has no information on {@code host}.
   */
  public Stats getStats(Host host) {
    return stats.get(host);
  }

  /** A snapshot of the statistics on a given host kept by {@code LatencyAwarePolicy}. */
  public static class Stats {

    private final long lastUpdatedSince;
    private final long average;
    private final long nbMeasurements;

    private Stats(long lastUpdatedSince, long average, long nbMeasurements) {
      this.lastUpdatedSince = lastUpdatedSince;
      this.average = average;
      this.nbMeasurements = nbMeasurements;
    }

    /**
     * The number of nanoseconds since the last latency update was recorded (at the time of the
     * snapshot).
     *
     * @return the number of nanoseconds since the last latency update was recorded (at the time
     *     of the snapshot).
     */
    public long lastUpdatedSince() {
      return lastUpdatedSince;
    }

    /**
     * The latency score for the host this is the stats of at the time of the snapshot.
     *
     * @return the latency score for the host this is the stats of at the time of the snapshot,
     *     or {@code -1L} if not enough measurements have been taken to assign a score.
     */
    public long getLatencyScore() {
      return average;
    }

    /**
     * The number of recorded latency measurements for the host this is the stats of.
     *
     * @return the number of recorded latency measurements for the host this is the stats of.
     */
    public long getMeasurementsCount() {
      return nbMeasurements;
    }
  }
}
/**
* A set of DriverException subclasses that we should prevent from updating the host's score. The
* intent behind it is to filter out "fast" errors: when a host replies with such errors, it
* usually does so very quickly, because it did not involve any actual coordination work. Such
* errors are not good indicators of the host's responsiveness, and tend to make the host's score
* look better than it actually is.
*/
private static final Set> EXCLUDED_EXCEPTIONS =
ImmutableSet.of(
UnavailableException.class, // this is done via the snitch and is usually very fast
OverloadedException.class,
BootstrappingException.class,
UnpreparedException.class,
QueryValidationException
.class // query validation also happens at early stages in the coordinator
);
/** Per-host latency bookkeeping, registered with the cluster as a {@link LatencyTracker}. */
private class Tracker implements LatencyTracker {

  // One latency tracker per live host; entries are added on up/add and removed on down/remove.
  private final ConcurrentMap<Host, HostLatencyTracker> latencies =
      new ConcurrentHashMap<Host, HostLatencyTracker>();
  // Cached minimum average latency across hosts, in nanoseconds; -1 until first computed.
  private volatile long cachedMin = -1L;

  @Override
  public void update(
      final Host host, Statement statement, Exception exception, long newLatencyNanos) {
    HostLatencyTracker hostTracker = latencies.get(host);
    if (hostTracker != null) {
      if (shouldConsiderNewLatency(statement, exception)) {
        hostTracker.add(newLatencyNanos);
      } else if (hostMetricsEnabled()) {
        metrics
            .getRegistry()
            .counter(MetricsUtil.hostMetricName("LatencyAwarePolicy.ignored-latencies.", host))
            .inc();
      }
    }
  }

  // Whether a measured latency should be folded into the host's score: successful queries
  // always count, "fast" errors (see EXCLUDED_EXCEPTIONS) never do.
  private boolean shouldConsiderNewLatency(Statement statement, Exception exception) {
    // query was successful: always consider
    if (exception == null) return true;
    // filter out "fast" errors
    if (EXCLUDED_EXCEPTIONS.contains(exception.getClass())) return false;
    return true;
  }

  // Recomputes the cached minimum over all hosts with enough fresh measurements; called
  // periodically from the Updater task.
  public void updateMin() {
    long newMin = Long.MAX_VALUE;
    long now = System.nanoTime();
    for (HostLatencyTracker tracker : latencies.values()) {
      TimestampedAverage latency = tracker.getCurrentAverage();
      if (latency != null
          && latency.average >= 0
          && latency.nbMeasure >= minMeasure
          && (now - latency.timestamp) <= retryPeriod) newMin = Math.min(newMin, latency.average);
    }
    // Keep the previous cached value if no host currently qualifies.
    if (newMin != Long.MAX_VALUE) cachedMin = newMin;
  }

  public long getMinAverage() {
    return cachedMin;
  }

  public TimestampedAverage latencyOf(Host host) {
    HostLatencyTracker tracker = latencies.get(host);
    return tracker == null ? null : tracker.getCurrentAverage();
  }

  public Map<Host, TimestampedAverage> currentLatencies() {
    Map<Host, TimestampedAverage> map =
        new HashMap<Host, TimestampedAverage>(latencies.size());
    for (Map.Entry<Host, HostLatencyTracker> entry : latencies.entrySet()) {
      TimestampedAverage average = entry.getValue().getCurrentAverage();
      // average may be null if no latencies have been recorded yet for a host.
      if (average != null) {
        map.put(entry.getKey(), average);
      }
    }
    return map;
  }

  public void addHost(final Host host) {
    logger.debug("Adding tracker for {}", host);
    // putIfAbsent so that a concurrent add keeps the existing measurement history.
    HostLatencyTracker old =
        latencies.putIfAbsent(host, new HostLatencyTracker(scale, (30L * minMeasure) / 100L));
    if (old == null && hostMetricsEnabled()) {
      String metricName = MetricsUtil.hostMetricName("LatencyAwarePolicy.latencies.", host);
      if (!metrics.getRegistry().getNames().contains(metricName)) {
        logger.debug("Adding gauge " + metricName);
        metrics
            .getRegistry()
            .register(
                metricName,
                new Gauge<Long>() {
                  @Override
                  public Long getValue() {
                    TimestampedAverage latency = latencyTracker.latencyOf(host);
                    return (latency == null) ? -1 : latency.average;
                  }
                });
      }
    }
  }

  public void resetHost(Host host) {
    logger.debug("Removing tracker for {}", host);
    latencies.remove(host);
  }

  @Override
  public void onRegister(Cluster cluster) {
    // nothing to do
  }

  @Override
  public void onUnregister(Cluster cluster) {
    // nothing to do
  }
}
/** Immutable (timestamp, average, count) triple produced by {@code HostLatencyTracker}. */
private static class TimestampedAverage {
// Time (System.nanoTime) at which this average was computed.
private final long timestamp;
// Exponentially-weighted average latency in nanoseconds, or -1 while warming up.
private final long average;
// Total number of measurements recorded so far for the host.
private final long nbMeasure;
TimestampedAverage(long timestamp, long average, long nbMeasure) {
this.timestamp = timestamp;
this.average = average;
this.nbMeasure = nbMeasure;
}
}
/** Lock-free accumulator of a single host's exponentially-weighted average latency. */
private static class HostLatencyTracker {

  // Number of initial measurements to ignore entirely (JVM warmup etc.); see
  // Builder#withMininumMeasurements.
  private final long thresholdToAccount;
  // Decay scale in nanoseconds, kept as a double since it is only used in double arithmetic.
  private final double scale;
  private final AtomicReference<TimestampedAverage> current =
      new AtomicReference<TimestampedAverage>();

  HostLatencyTracker(long scale, long thresholdToAccount) {
    this.scale = (double) scale; // We keep in double since that's how we'll use it.
    this.thresholdToAccount = thresholdToAccount;
  }

  /** Folds a new latency measurement into the running average (CAS retry loop). */
  public void add(long newLatencyNanos) {
    TimestampedAverage previous, next;
    do {
      previous = current.get();
      next = computeNextAverage(previous, newLatencyNanos);
    } while (next != null && !current.compareAndSet(previous, next));
  }

  private TimestampedAverage computeNextAverage(
      TimestampedAverage previous, long newLatencyNanos) {
    long currentTimestamp = System.nanoTime();
    long nbMeasure = previous == null ? 1 : previous.nbMeasure + 1;
    // The very first measurements are counted but not averaged (average stays -1), to avoid
    // skewing the score with warmup latencies.
    if (nbMeasure < thresholdToAccount)
      return new TimestampedAverage(currentTimestamp, -1L, nbMeasure);
    if (previous == null || previous.average < 0)
      return new TimestampedAverage(currentTimestamp, newLatencyNanos, nbMeasure);
    // Note: it's possible for the delay to be 0, in which case newLatencyNanos will basically
    // be discarded. It's fine: nanoTime is precise enough in practice that even if it happens,
    // it will be very rare, and discarding a latency every once in a while is not the end of
    // the world.
    // We do test for negative values, even though in theory that should not happen, because it
    // seems that historically there have been bugs here
    // (https://blogs.oracle.com/dholmes/entry/inside_the_hotspot_vm_clocks)
    // so while this is almost surely not a problem anymore, there's no reason to break the
    // computation if this ever happens.
    long delay = currentTimestamp - previous.timestamp;
    if (delay <= 0) return null;
    double scaledDelay = ((double) delay) / scale;
    // Note: We don't use log1p because it's quite a bit slower and we don't care about the
    // precision (and since we refuse ridiculously big scales, scaledDelay can't be so low that
    // scaledDelay+1 == 1.0 (due to rounding)).
    double prevWeight = Math.log(scaledDelay + 1) / scaledDelay;
    long newAverage =
        (long) ((1.0 - prevWeight) * newLatencyNanos + prevWeight * previous.average);
    return new TimestampedAverage(currentTimestamp, newAverage, nbMeasure);
  }

  public TimestampedAverage getCurrentAverage() {
    return current.get();
  }
}
/**
 * Helper builder object to create a latency aware policy.
 *
 * <p>This helper allows to configure the different parameters used by {@code LatencyAwarePolicy}.
 * The only mandatory parameter is the child policy that will be wrapped with latency awareness.
 * The other parameters can be set through the methods of this builder, but all have defaults
 * (that are documented in the javadoc of each method) if you don't.
 *
 * <p>If you observe that the resulting policy excludes hosts too aggressively or not enough so,
 * the main parameters to check are the exclusion threshold ({@link #withExclusionThreshold}) and
 * scale ({@link #withScale}).
 *
 * @since 1.0.4
 */
public static class Builder {

  public static final double DEFAULT_EXCLUSION_THRESHOLD = 2.0;
  public static final long DEFAULT_SCALE_NANOS = TimeUnit.MILLISECONDS.toNanos(100);
  public static final long DEFAULT_RETRY_PERIOD_NANOS = TimeUnit.SECONDS.toNanos(10);
  public static final long DEFAULT_UPDATE_RATE_NANOS = TimeUnit.MILLISECONDS.toNanos(100);
  public static final int DEFAULT_MIN_MEASURE = 50;

  private final LoadBalancingPolicy childPolicy;
  private double exclusionThreshold = DEFAULT_EXCLUSION_THRESHOLD;
  private long scale = DEFAULT_SCALE_NANOS;
  private long retryPeriod = DEFAULT_RETRY_PERIOD_NANOS;
  private long updateRate = DEFAULT_UPDATE_RATE_NANOS;
  private int minMeasure = DEFAULT_MIN_MEASURE;

  /**
   * Creates a new latency aware policy builder given the child policy that the resulting policy
   * wraps.
   *
   * @param childPolicy the load balancing policy to wrap with latency awareness.
   */
  public Builder(LoadBalancingPolicy childPolicy) {
    this.childPolicy = childPolicy;
  }

  /**
   * Sets the exclusion threshold to use for the resulting latency aware policy.
   *
   * <p>The exclusion threshold controls how much worse the average latency of a node must be
   * compared to the fastest performing node for it to be penalized by the policy.
   *
   * <p>The default exclusion threshold (if this method is not called) is 2. In other
   * words, the resulting policy excludes nodes that are more than twice slower than the fastest
   * node.
   *
   * @param exclusionThreshold the exclusion threshold to use. Must be greater or equal to 1.
   * @return this builder.
   * @throws IllegalArgumentException if {@code exclusionThreshold < 1}.
   */
  public Builder withExclusionThreshold(double exclusionThreshold) {
    // Message matches the documented contract: values >= 1 are accepted.
    if (exclusionThreshold < 1d)
      throw new IllegalArgumentException(
          "Invalid exclusion threshold, must be greater than or equal to 1.");
    this.exclusionThreshold = exclusionThreshold;
    return this;
  }

  /**
   * Sets the scale to use for the resulting latency aware policy.
   *
   * <p>The {@code scale} provides control on how the weight given to older latencies decreases
   * over time. For a given host, if a new latency {@code l} is received at time {@code t}, and
   * the previously calculated average is {@code prev} calculated at time {@code t'}, then the
   * newly calculated average {@code avg} for that host is calculated thusly:
   *
   * <pre>{@code
   * d = (t - t') / scale
   * alpha = 1 - (ln(d+1) / d)
   * avg = alpha * l + (1 - alpha) * prev
   * }</pre>
   *
   * <p>Typically, with a {@code scale} of 100 milliseconds (the default), if a new latency is
   * measured and the previous measure is 10 millisecond old (so {@code d=0.1}), then {@code
   * alpha} will be around {@code 0.05}. In other words, the new latency will weight 5% of the
   * updated average. A bigger scale will give less weight to new measurements (compared to
   * previous ones), a smaller one will give them more weight.
   *
   * <p>The default scale (if this method is not used) is of 100 milliseconds. If unsure,
   * try this default scale first and experiment only if it doesn't provide acceptable results
   * (hosts are excluded too quickly or not fast enough and tuning the exclusion threshold
   * doesn't help).
   *
   * @param scale the scale to use.
   * @param unit the unit of {@code scale}.
   * @return this builder.
   * @throws IllegalArgumentException if {@code scale <= 0}.
   */
  public Builder withScale(long scale, TimeUnit unit) {
    if (scale <= 0)
      throw new IllegalArgumentException("Invalid scale, must be strictly positive");
    this.scale = unit.toNanos(scale);
    return this;
  }

  /**
   * Sets the retry period for the resulting latency aware policy.
   *
   * <p>The retry period defines how long a node may be penalized by the policy before it is
   * given a 2nd chance. More precisely, a node is excluded from query plans if both its
   * calculated average latency is {@code exclusionThreshold} times slower than the fastest node
   * average latency (at the time the query plan is computed) and its calculated average latency
   * has been updated since less than {@code retryPeriod}. Since penalized nodes will likely not
   * see their latency updated, this is basically how long the policy will exclude a node.
   *
   * @param retryPeriod the retry period to use.
   * @param unit the unit for {@code retryPeriod}.
   * @return this builder.
   * @throws IllegalArgumentException if {@code retryPeriod < 0}.
   */
  public Builder withRetryPeriod(long retryPeriod, TimeUnit unit) {
    if (retryPeriod < 0)
      throw new IllegalArgumentException("Invalid retry period, must be positive");
    this.retryPeriod = unit.toNanos(retryPeriod);
    return this;
  }

  /**
   * Sets the update rate for the resulting latency aware policy.
   *
   * <p>The update rate defines how often the minimum average latency is recomputed. While the
   * average latency score of each node is computed iteratively (updated each time a new latency
   * is collected), the minimum score needs to be recomputed from scratch every time, which is
   * slightly more costly. For this reason, the minimum is only re-calculated at the given fixed
   * rate and cached between re-calculation.
   *
   * <p>The default update rate is 100 milliseconds, which should be appropriate for most
   * applications. In particular, note that while we want to avoid to recompute the minimum for
   * every query, that computation is not particularly intensive either and there is no reason
   * to use a very slow rate (more than a second is probably unnecessarily slow for instance).
   *
   * @param updateRate the update rate to use.
   * @param unit the unit for {@code updateRate}.
   * @return this builder.
   * @throws IllegalArgumentException if {@code updateRate <= 0}.
   */
  public Builder withUpdateRate(long updateRate, TimeUnit unit) {
    if (updateRate <= 0)
      throw new IllegalArgumentException("Invalid update rate value, must be strictly positive");
    this.updateRate = unit.toNanos(updateRate);
    return this;
  }

  /**
   * Sets the minimum number of measurements per-host to consider for the resulting latency
   * aware policy.
   *
   * <p>Penalizing nodes is based on an average of their recently measured average latency. This
   * average is only meaningful if a minimum of measurements have been collected (moreover, a
   * newly started Cassandra node will tend to perform relatively poorly on the first queries
   * due to the JVM warmup). This is what this option controls. If less than {@code minMeasure}
   * data points have been collected for a given host, the policy will never penalize that host.
   * Also, the 30% first measurements will be entirely ignored (in other words, the {@code 30% *
   * minMeasure} first measurements to a node are entirely ignored, while the {@code 70%} next
   * ones are accounted in the latency computed but the node won't get convicted until we've had
   * at least {@code minMeasure} measurements).
   *
   * <p>Note that the number of collected measurements for a given host is reset if the node is
   * restarted.
   *
   * <p>The default for this option (if this method is not called) is 50. Note that it is
   * probably not a good idea to put this option too low if only to avoid the influence of JVM
   * warm-up on newly restarted nodes.
   *
   * @param minMeasure the minimum measurements to consider.
   * @return this builder.
   * @throws IllegalArgumentException if {@code minMeasure < 0}.
   */
  public Builder withMininumMeasurements(int minMeasure) {
    // Historical (misspelled) name kept for backward compatibility; delegates to the
    // correctly-spelled variant.
    return withMinimumMeasurements(minMeasure);
  }

  /**
   * Sets the minimum number of measurements per-host to consider for the resulting latency
   * aware policy; correctly-spelled equivalent of {@link #withMininumMeasurements(int)}.
   *
   * @param minMeasure the minimum measurements to consider.
   * @return this builder.
   * @throws IllegalArgumentException if {@code minMeasure < 0}.
   */
  public Builder withMinimumMeasurements(int minMeasure) {
    if (minMeasure < 0)
      throw new IllegalArgumentException("Invalid minimum measurements value, must be positive");
    this.minMeasure = minMeasure;
    return this;
  }

  /**
   * Builds a new latency aware policy using the options set on this builder.
   *
   * @return the newly created {@code LatencyAwarePolicy}.
   */
  public LatencyAwarePolicy build() {
    return new LatencyAwarePolicy(
        childPolicy, exclusionThreshold, scale, retryPeriod, updateRate, minMeasure);
  }
}
/** Closes the child policy and stops the background minimum-updater task. */
@Override
public void close() {
childPolicy.close();
updaterService.shutdown();
}
// Per-host metrics require both the opt-in system property and an available metrics registry.
private boolean hostMetricsEnabled() {
return HOST_METRICS_ENABLED && metrics != null;
}
}