io.nosqlbench.engine.api.activityapi.ratelimits.HybridRateLimiter Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of engine-api Show documentation
The engine API for nosqlbench; Provides the interfaces needed to build internal modules for the nosqlbench core engine
There is a newer version: 5.17.0
/*
 *
 *    Copyright 2016 jshook
 *    Licensed under the Apache License, Version 2.0 (the "License");
 *    you may not use this file except in compliance with the License.
 *    You may obtain a copy of the License at
 *
 *        http://www.apache.org/licenses/LICENSE-2.0
 *
 *    Unless required by applicable law or agreed to in writing, software
 *    distributed under the License is distributed on an "AS IS" BASIS,
 *    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *    See the License for the specific language governing permissions and
 *    limitations under the License.
 * /
 */

package io.nosqlbench.engine.api.activityapi.ratelimits;

import com.codahale.metrics.Gauge;
import io.nosqlbench.engine.api.activityapi.core.Startable;
import io.nosqlbench.engine.api.activityimpl.ActivityDef;
import io.nosqlbench.engine.api.metrics.ActivityMetrics;
import io.nosqlbench.nb.annotations.Service;
import org.apache.logging.log4j.LogManager;
import org.apache.logging.log4j.Logger;

import java.util.concurrent.atomic.AtomicLong;

/**
 * Synopsis
 * This rate limiter uses nanoseconds as the unit of timing. This
 * works well because it is the native precision of the system timer
 * interface via {@link System#nanoTime()}. It is also low-error
 * in terms of rounding between floating point rates and nanoseconds,
 * at least in the round numbers that users tend to use. Further,
 * the current scheduling state is maintained as an atomic view of
 * accumulated nanoseconds granted to callers -- referred to here as the
 * ticks accumulator. This further simplifies the implementation by
 * allowing direct comparison of scheduled times with the current
 * state of the high-resolution system timer.
 *
 * 
Design Notes
 * This implementation makes certain trade-offs needed to support a combination of requirements.
 * Specifically, some small degree of inaccuracy is allowed to enable higher throughput when
 * needed. Some practical limitations affect how accurate we can be:
 *
 * 
 * This is not a real-time system with guarantees on scheduling.
 * Calling overhead is significant for reading the RTC or sleeping.
 * Controlling the accuracy of a delay is not possible under any level of load.
 * It is undesirable (wasteful) to use spin loops to delay.
 * 
 *
 * Together, these factors mean a compromise is inevitable. In practice it means that a very accurate
 * implementation will likely be very slow, and a very fast implementation will likely be very inaccurate.
 * This implementation tries to strike a balance, providing accuracy near the microsecond level,
 * while allowing rates in the tens of millions per second, even under heavy thread contention.
 *
 * Burst Ratio
 * 
 * This rate limiter provides a sliding scale between strict rate limiting and average rate limiting,
 * the difference between the two controlled by a burst ratio parameter. When the burst
 * ratio is 1.0, the rate limiter acts as a strict rate limiter, disallowing faster operations
 * from using time that was previously forfeited by prior slower operations. This is a "use it
 * or lose it" mode that means things like GC events can steal throughput from a running client
 * as a necessary effect of losing time in a strict timing sense.
 * 
 *
 * 
 * When the burst ratio is set to higher than 1.0, faster operations may recover lost time from
 * previously slower operations. This means that any valleys created in the actual op rate of the
 * client can be converted into plateaus of throughput above the strict rate, but only at a speed that
 * fits within (op rate * burst ratio). This allows for workloads to approximate the average
 * target rate over time, with controllable bursting rates. This ability allows for near-strict
 * behavior while allowing clients to still track truer to rate limit expectations, so long as the
 * overall workload is not saturating resources.
 * 
 */
@Service(value = RateLimiter.class, selector = "hybrid")
public class HybridRateLimiter implements Startable, RateLimiter {

    private final static Logger logger = LogManager.getLogger(HybridRateLimiter.class);

    //private volatile TokenFiller filler;
    private volatile long starttime;

    // rate controls
    private RateSpec rateSpec;

    // basic state
    private ActivityDef activityDef;
    private String label;
    private State state = State.Idle;
    // metrics
    private Gauge delayGauge;
    private Gauge avgRateGauge;
    private Gauge burstRateGauge;
    private TokenPool tokens;
    // diagnostics

    // TODO Doc rate limiter scenarios, including when you want to reset the waittime, and when you don't
    private final AtomicLong cumulativeWaitTimeNanos = new AtomicLong(0L);

    protected HybridRateLimiter() {
    }

    public HybridRateLimiter(ActivityDef def, String label, RateSpec rateSpec) {
        setActivityDef(def);
        setLabel(label);
        init(activityDef);
        this.applyRateSpec(rateSpec);
    }

    protected void setLabel(String label) {
        this.label = label;
    }

    protected void setActivityDef(ActivityDef def) {
        this.activityDef = def;
    }

    @Override
    public long maybeWaitForOp() {
        return tokens.blockAndTake();
    }

    @Override
    public long getTotalWaitTime() {
        return this.cumulativeWaitTimeNanos.get() + getWaitTime();
    }

    @Override
    public long getWaitTime() {
        return tokens.getWaitTime();
    }

    @Override
    public RateSpec getRateSpec() {
        return this.rateSpec;
    }

    @Override
    public synchronized void applyRateSpec(RateSpec updatingRateSpec) {

        if (updatingRateSpec == null) {
            throw new RuntimeException("RateSpec must be defined");
        }

        if (updatingRateSpec.equals(this.rateSpec) && !updatingRateSpec.isRestart()) {
            return;
        }

        this.rateSpec = updatingRateSpec;
        this.tokens = (this.tokens == null) ? new ThreadDrivenTokenPool(rateSpec, activityDef) : this.tokens.apply(rateSpec);
//        this.filler = (this.filler == null) ? new TokenFiller(rateSpec, activityDef) : filler.apply(rateSpec);
//        this.tokens = this.filler.getTokenPool();

        if (this.state == State.Idle && updatingRateSpec.isAutoStart()) {
            this.start();
        } else if (updatingRateSpec.isRestart()) {
            this.restart();
        }
    }


    protected void init(ActivityDef activityDef) {
        this.delayGauge = ActivityMetrics.gauge(activityDef, label + ".waittime", new RateLimiters.WaitTimeGauge(this));
        this.avgRateGauge = ActivityMetrics.gauge(activityDef, label + ".config.cyclerate", new RateLimiters.RateGauge(this));
        this.burstRateGauge = ActivityMetrics.gauge(activityDef, label + ".config.burstrate", new RateLimiters.BurstRateGauge(this));
    }

    public synchronized void start() {

        switch (state) {
            case Started:
//                logger.warn("Tried to start a rate limiter that was already started. If this is desired, use restart() instead");
                // TODO: Find a better way to warn about spurious rate limiter
                // starts, since the check condition was not properly isolated
            case Idle:
                long nanos = getNanoClockTime();
                this.starttime = nanos;
                this.tokens.start();
                state = State.Started;
                break;
        }
    }

    public synchronized long restart() {
        switch (state) {
            case Idle:
                this.start();
                return 0L;
            case Started:
                long accumulatedWaitSinceLastStart = cumulativeWaitTimeNanos.get();
                cumulativeWaitTimeNanos.set(0L);
                return this.tokens.restart() + accumulatedWaitSinceLastStart;
            default:
                return 0L;
        }
    }

    @Override
    public long getStartTime() {
        return 0;
    }

    private synchronized void checkpointCumulativeWaitTime() {
        long nanos = getNanoClockTime();
        this.starttime = nanos;
        cumulativeWaitTimeNanos.addAndGet(getWaitTime());
    }

    protected long getNanoClockTime() {
        return System.nanoTime();
    }

    @Override
    public String toString() {
        StringBuilder sb = new StringBuilder(HybridRateLimiter.class.getSimpleName());
        sb.append("{\n");
        if (this.getRateSpec() != null) {
            sb.append("      spec:").append(this.getRateSpec().toString());
        }
        if (this.tokens != null) {
            sb.append(",\n tokenpool:").append(this.tokens.toString());
        }
        if (this.state != null) {
            sb.append(",\n     state:'").append(this.state).append("'");
        }
        sb.append("\n}");
        return sb.toString();
    }

//    public String getRefillLog() {
//        return this.filler.getRefillLog();
//    }

    private enum State {
        Idle,
        Started
    }

    private class PoolGauge implements Gauge {
        private final HybridRateLimiter rl;

        public PoolGauge(HybridRateLimiter hybridRateLimiter) {
            this.rl = hybridRateLimiter;
        }

        @Override
        public Long getValue() {
            TokenPool pool = rl.tokens;
            if (pool==null) {
                return 0L;
            }
            return pool.getWaitTime();
        }
    }
}