All Downloads are FREE. Search and download functionalities are using the official Maven repository.

io.engineblock.activityapi.ratelimits.HybridRateLimiter Maven / Gradle / Ivy

Go to download

The driver API for engineblock; Provides the interfaces needed to build drivers that can be loaded by engineblock core

There is a newer version: 2.12.65
Show newest version
/*
 *
 *    Copyright 2016 jshook
 *    Licensed under the Apache License, Version 2.0 (the "License");
 *    you may not use this file except in compliance with the License.
 *    You may obtain a copy of the License at
 *
 *        http://www.apache.org/licenses/LICENSE-2.0
 *
 *    Unless required by applicable law or agreed to in writing, software
 *    distributed under the License is distributed on an "AS IS" BASIS,
 *    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *    See the License for the specific language governing permissions and
 *    limitations under the License.
 * /
 */

package io.engineblock.activityapi.ratelimits;

import com.codahale.metrics.Gauge;
import io.engineblock.activityapi.core.Startable;
import io.engineblock.activityimpl.ActivityDef;
import io.engineblock.metrics.ActivityMetrics;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.util.concurrent.atomic.AtomicLong;

/**
 * 

Synopsis

*

This rate limiter uses nanoseconds as the unit of timing. This * works well because it is the native precision of the system timer * interface via {@link System#nanoTime()}. It is also low-error * in terms of rounding between floating point rates and nanoseconds, * at least in the round numbers that users tend to use. Further, * the current scheduling state is maintained as an atomic view of * accumulated nanoseconds granted to callers -- referred to here as the * ticks accumulator. This further simplifies the implementation by * allowing direct comparison of scheduled times with the current * state of the high-resolution system timer. * *

Design Notes

* This implementation makes certain trade-offs needed to support a combination of requirements. * Specifically, some small degree of inaccuracy is allowed to enable higher throughput when * needed. Some practical limitations affect how accurate we can be: * *
    *
  1. This is not a real-time system with guarantees on scheduling.
  2. *
  3. Calling overhead is significant for reading the RTC or sleeping.
  4. *
  5. Controlling the accuracy of a delay is not possible under any level of load.
  6. *
  7. It is undesirable (wasteful) to use spin loops to delay.
  8. *
* * Together, these factors mean a compromise is inevitable. In practice it means that a very accurate * implementation will likely be very slow, and a very fast implementation will likely be very inaccurate. * This implementation tries to strike a balance, providing accuracy near the microsecond level, * while allowing rates in the tens of millions per second, even under heavy thread contention. * *

Burst Ratio

*

* This rate limiter provides a sliding scale between strict rate limiting and average rate limiting, * the difference between the two controlled by a burst ratio parameter. When the burst * ratio is 1.0, the rate limiter acts as a strict rate limiter, disallowing faster operations * from using time that was previously forfeited by prior slower operations. This is a "use it * or lose it" mode that means things like GC events can steal throughput from a running client * as a necessary effect of losing time in a strict timing sense. *

* *

* When the burst ratio is set to higher than 1.0, faster operations may recover lost time from * previously slower operations. This means that any valleys created in the actual op rate of the * client can be converted into plateaus of throughput above the strict rate, but only at a speed that * fits within (op rate * burst ratio). This allows for workloads to approximate the average * target rate over time, with controllable bursting rates. This ability allows for near-strict * behavior while allowing clients to still track truer to rate limit expectations, so long as they * overall workload is not saturating resources. *

*/ public class HybridRateLimiter implements Startable, RateLimiter { private final static Logger logger = LoggerFactory.getLogger(HybridRateLimiter.class); private volatile TokenFiller filler; private volatile long starttime; // rate controls private RateSpec rateSpec; // basic state private ActivityDef activityDef; private String label; private State state = State.Idle; // metrics private Gauge delayGauge; private Gauge avgRateGauge; private Gauge burstRateGauge; private TokenPool tokens; // diagnostics // TODO Doc rate limiter scenarios, including when you want to reset the waittime, and when you don't private AtomicLong cumulativeWaitTimeNanos = new AtomicLong(0L); protected HybridRateLimiter() { } public HybridRateLimiter(ActivityDef def, String label, RateSpec rateSpec) { setActivityDef(def); setLabel(label); init(activityDef); this.applyRateSpec(rateSpec); } protected void setLabel(String label) { this.label = label; } protected void setActivityDef(ActivityDef def) { this.activityDef = def; } @Override public long maybeWaitForOp() { return tokens.blockAndTake(); } @Override public long getTotalWaitTime() { return this.cumulativeWaitTimeNanos.get() + getWaitTime(); } @Override public long getWaitTime() { return tokens.getWaitTime(); } @Override public RateSpec getRateSpec() { return this.rateSpec; } @Override public synchronized void applyRateSpec(RateSpec updatingRateSpec) { if (updatingRateSpec == null) { throw new RuntimeException("RateSpec must be defined"); } if (updatingRateSpec.equals(this.rateSpec) && !updatingRateSpec.isRestart()) { return; } this.rateSpec = updatingRateSpec; this.filler = (this.filler == null) ? new TokenFiller(rateSpec, activityDef) : filler.apply(rateSpec); this.tokens = this.filler.getTokenPool(); if (this.state == State.Idle && updatingRateSpec.isAutoStart()) { this.start(); } else if (updatingRateSpec.isRestart()) { this.restart(); } } protected void init(ActivityDef activityDef) { this.delayGauge = ActivityMetrics.gauge(activityDef, label + ".waittime", new RateLimiters.WaitTimeGauge(this)); this.avgRateGauge = ActivityMetrics.gauge(activityDef, label + ".config.cyclerate", new RateLimiters.RateGauge(this)); this.burstRateGauge = ActivityMetrics.gauge(activityDef, label + ".config.burstrate", new RateLimiters.BurstRateGauge(this)); } public synchronized void start() { switch (state) { case Started: logger.warn("Tried to start a rate limiter that was already started. If this is desired, use restart() instead"); case Idle: long nanos = getNanoClockTime(); this.starttime = nanos; this.filler.start(); state = State.Started; break; } } public synchronized long restart() { switch (state) { case Idle: this.start(); return 0L; case Started: long accumulatedWaitSinceLastStart = cumulativeWaitTimeNanos.get(); cumulativeWaitTimeNanos.set(0L); return this.filler.restart() + accumulatedWaitSinceLastStart; default: return 0L; } } @Override public long getStartTime() { return 0; } private synchronized void checkpointCumulativeWaitTime() { long nanos = getNanoClockTime(); this.starttime = nanos; cumulativeWaitTimeNanos.addAndGet(getWaitTime()); } protected long getNanoClockTime() { return System.nanoTime(); } @Override public String toString() { return //"ID:"+System.identityHashCode(this)+" "+ this.getRateSpec().toString() + "(" + this.state + ") pool:" + filler; } // public String getRefillLog() { // return this.filler.getRefillLog(); // } private enum State { Idle, Started } private class PoolGauge implements Gauge { private final HybridRateLimiter rl; public PoolGauge(HybridRateLimiter hybridRateLimiter) { this.rl = hybridRateLimiter; } @Override public Long getValue() { TokenPool pool = rl.filler.getTokenPool(); if (pool==null) { return 0L; } return pool.getWaitTime(); } } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy