org.spf4j.failsafe.RateLimiter Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of spf4j-core Show documentation
Show all versions of spf4j-core Show documentation
A continuously growing collection of utilities to measure performance, get better diagnostics,
improve performance, or do things more reliably, faster that other open source libraries...
/*
* Copyright (c) 2001-2017, Zoltan Farkas All Rights Reserved.
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
*
* Additionally licensed with:
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.spf4j.failsafe;
import com.google.common.annotations.Beta;
import edu.umd.cs.findbugs.annotations.SuppressFBWarnings;
import java.time.Duration;
import java.util.concurrent.ScheduledExecutorService;
import java.util.concurrent.ScheduledFuture;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicLong;
import java.util.function.LongBinaryOperator;
import java.util.function.LongSupplier;
import javax.annotation.CheckReturnValue;
import javax.annotation.Nonnegative;
import javax.annotation.Signed;
import javax.annotation.concurrent.GuardedBy;
import org.spf4j.base.ExecutionContexts;
import org.spf4j.base.TimeSource;
import org.spf4j.concurrent.Atomics;
import org.spf4j.concurrent.DefaultScheduler;
import org.spf4j.concurrent.PermitSupplier;
/**
* Token bucket algorithm base call rate limiter. see https://en.wikipedia.org/wiki/Token_bucket for more detail.
* Unlike the Guava implementation, the token replenishment is done in a separate thread.
* As such permit acquisition methods have lower overhead
* (no System.nanotime invocation is made when permits available),
* This lower overhead comes at the cost of increasing the cost of RateLimiter object instance. (a scheduled runnable)
* This implementation also uses CAS to update the permit bucket which should yield better concurrency characteristics.
* there is a backoff to handle high contention better as well
* (see https://dzone.com/articles/wanna-get-faster-wait-bit)
*
* The different in performance can be observed in a benchmark where we try to limit 10000000 ops/s:
*
* Benchmark Mode Cnt Score Error Units
* com.google.common.util.concurrent.GuavaRateLimiterBenchmark.acquire thrpt 10 8197739.576 ± 163437.214 ops/s
* org.spf4j.failsafe.Spf4jRateLimiterBenchmark.acquire thrpt 10 9791489.540 ± 89480.010 ops/s
*
* The Guava implementation cannot really get as close to the desired rate as the spf4j implementation.
*
* The spf4j implementation tops of at about:
*
* Benchmark Mode Cnt Score Error Units
* Spf4jRateLimiterBenchmark.acquire thrpt 10 15270385.653 ± 507217.444 ops/s
*
* these benchmarks are artificial and really measure the overhead of permit acquisition alone without doing anything
* else, real use cases will accompany a permit acquision with some work which impacts the CAS/lock acquisition perf...
*
* Rate Limiter also implements the PermitSupplier abstraction along with GuavaRateLimiter allowing interchangeability
* between the 2 implementations based on what trade-of work better for you.
* PermitSupplier allows interchangeability and combination with Semaphore (extends PermitSupplier) implementations.
*
* @author Zoltan Farkas
*/
@Beta
public final class RateLimiter
implements AutoCloseable, PermitSupplier {
private static final int RE_READ_TIME_AFTER_RETRIES = Integer.getInteger("spf4j.rateLimiter.reReadTimeAfterTries", 5);
private static final long DEFAULT_MIN_REPLENISH_INTERVAL_MS
= Long.getLong("spf4j.rateLimiter.defaultMinReplenishIntervalMs", 10L);
private final AtomicLong permits;
private final ScheduledFuture> replenisher;
private final long permitsPerReplenishInterval;
private final long permitReplenishIntervalNanos;
private final LongSupplier nanoTimeSupplier;
/**
* the time at which replenishment has been made.
*/
@GuardedBy("sync")
private long lastReplenishmentNanos;
private final Object sync;
private final int maxBackoffNanos;
private final LongBinaryOperator accumulate;
public RateLimiter(final long permitsPerReplenishInterval,
final Duration replenishmentInterval,
final long maxBurstSize, final long minReplenishInterval, final TimeUnit tu) {
this(permitsPerReplenishInterval, replenishmentInterval, maxBurstSize, minReplenishInterval, tu,
DefaultScheduler.INSTANCE, TimeSource.nanoTimeSupplier());
}
public RateLimiter(final long permitsPerReplenishInterval,
final Duration replenishmentInterval,
final long maxBurstSize) {
this(permitsPerReplenishInterval, replenishmentInterval, maxBurstSize, DefaultScheduler.INSTANCE);
}
public RateLimiter(final long permitsPerReplenishInterval,
final Duration replenishmentInterval,
final long maxBurstSize,
final ScheduledExecutorService scheduler) {
this(permitsPerReplenishInterval, replenishmentInterval, maxBurstSize, scheduler, TimeSource.nanoTimeSupplier());
}
public RateLimiter(final long permitsPerReplenishInterval,
final Duration replenishmentInterval,
final long maxBurstSize,
final ScheduledExecutorService scheduler,
final LongSupplier nanoTimeSupplier) {
this(permitsPerReplenishInterval, replenishmentInterval, maxBurstSize, DEFAULT_MIN_REPLENISH_INTERVAL_MS,
TimeUnit.MILLISECONDS, scheduler, nanoTimeSupplier);
}
public RateLimiter(final long permitsPerReplenishInterval,
final Duration replenishmentInterval,
final long maxBurstSize,
final long minReplenishInterval,
final TimeUnit tu,
final ScheduledExecutorService scheduler,
final LongSupplier nanoTimeSupplier) {
this(permitsPerReplenishInterval, replenishmentInterval, maxBurstSize, minReplenishInterval, tu,
scheduler, nanoTimeSupplier, Atomics.MAX_BACKOFF_NANOS);
}
/**
* create the rate limiter.
*
* @param maxAvailablePermits the maximum number of permits that can accumulate.
* @param minReplenishInterval the minimum replenish interval, since a scheduler replenishes the tokens asynchronously
* there is a limit that is relative to the system clock resolution.
* @param tu the time unit of the minimum replenish interval.
* @param scheduler the scheduler to use to replenish the bucket.
* @param nanoTimeSupplier the time supplier.
* @param maxBackoffNanos expected concurrency level
*/
public RateLimiter(final long permitsPerReplenishInterval,
final Duration replenishmentInterval,
final long maxAvailablePermits,
final long minReplenishInterval,
final TimeUnit tu,
final ScheduledExecutorService scheduler,
final LongSupplier nanoTimeSupplier,
final int maxBackoffNanos) {
this(permitsPerReplenishInterval, replenishmentInterval, 0, maxAvailablePermits, minReplenishInterval, tu,
scheduler, nanoTimeSupplier, maxBackoffNanos);
}
/**
* create the rate limiter.
*
* @param maxAvailablePermits the maximum number of permits that can accumulate.
* @param minReplenishInterval the minimum replenish interval, since a scheduler replenishes the tokens asynchronously
* there is a limit that is relative to the system clock resolution.
* @param tu the time unit of the minimum replenish interval.
* @param scheduler the scheduler to use to replenish the bucket.
* @param nanoTimeSupplier the time supplier.
* @param maxBackoffNanos expected concurrency level
*/
public RateLimiter(final long permitsPerReplenishInterval,
final Duration replenishmentInterval,
final long initialNrOfPermits,
final long maxAvailablePermits,
final long minReplenishInterval,
final TimeUnit tu,
final ScheduledExecutorService scheduler,
final LongSupplier nanoTimeSupplier,
final int maxBackoffNanos) {
this.maxBackoffNanos = maxBackoffNanos;
this.sync = new Object();
this.nanoTimeSupplier = nanoTimeSupplier;
this.permitReplenishIntervalNanos = replenishmentInterval.toNanos();
this.permitsPerReplenishInterval = permitsPerReplenishInterval;
assert permitsPerReplenishInterval >= 1;
if (maxAvailablePermits < permitsPerReplenishInterval) {
throw new IllegalArgumentException("Invalid max burst size: " + maxAvailablePermits
+ ", increase maxBurstSize to something larger than " + permitsPerReplenishInterval
+ " we assume a clock resolution of " + permitReplenishIntervalNanos
+ " and that is the minimum replenish interval");
}
this.permits = new AtomicLong(initialNrOfPermits);
lastReplenishmentNanos = nanoTimeSupplier.getAsLong();
accumulate = (long left, long right) -> {
long result = left + right;
return (result > maxAvailablePermits) ? maxAvailablePermits : result;
};
this.replenisher = scheduler.scheduleAtFixedRate(() -> {
synchronized (sync) {
Atomics.accumulate(permits, permitsPerReplenishInterval, accumulate, maxBackoffNanos);
lastReplenishmentNanos = nanoTimeSupplier.getAsLong();
}
}, permitReplenishIntervalNanos, permitReplenishIntervalNanos, TimeUnit.NANOSECONDS);
}
@Override
public boolean addPermits(final int nrPermits) {
return Atomics.maybeAccumulate(permits, nrPermits, accumulate, maxBackoffNanos);
}
/**
* Try to acquire a permit if available.
*
* @return true if permit acquired. false otherwise.
*/
public boolean tryAcquire() {
return tryAcquire(1);
}
public boolean tryAcquire(final int nrPermits) {
return Atomics.maybeAccumulate(permits, nrPermits, (long prev, long x) -> {
long dif = prev - x;
// right will be -1d.
return (dif < 0) ? prev : dif;
}, maxBackoffNanos);
}
private final class ReservationHandler implements LongBinaryOperator, Acquisition {
private long currTimeNanos;
private final long deadlineNanos;
private long nsUntilResourcesAvailable;
private int reTimeCount;
private boolean isSuccess;
ReservationHandler(final long currTimeNanos, final long deadlineNanos) {
this.currTimeNanos = currTimeNanos;
this.deadlineNanos = deadlineNanos;
this.nsUntilResourcesAvailable = 0;
this.reTimeCount = RE_READ_TIME_AFTER_RETRIES;
this.isSuccess = false;
}
@Override
public long applyAsLong(final long prev, final long nrPermits) {
long remaimingPermits = prev - nrPermits;
if (remaimingPermits >= 0) {
isSuccess = true;
return remaimingPermits;
}
if (reTimeCount > 0) {
reTimeCount--;
} else {
// re-reading current time on every try is pointless since System.nanotime can take 30ns to exec...
reTimeCount = RE_READ_TIME_AFTER_RETRIES;
currTimeNanos = nanoTimeSupplier.getAsLong();
}
long timeoutNs = deadlineNanos - currTimeNanos;
long nsUntilNextReplenishment
= permitReplenishIntervalNanos - (currTimeNanos - lastReplenishmentNanos);
long permitsNeeded = -remaimingPermits;
if (permitsNeeded <= permitsPerReplenishInterval) {
nsUntilResourcesAvailable = nsUntilNextReplenishment;
return remaimingPermits;
} else {
int numberOfReplenishMentsNeed = permitsNeeded % permitsPerReplenishInterval == 0
? (int) (permitsNeeded / permitsPerReplenishInterval)
: (int) (permitsNeeded / permitsPerReplenishInterval + 1);
long nsNeeded = nsUntilNextReplenishment
+ (numberOfReplenishMentsNeed - 1) * permitReplenishIntervalNanos;
nsUntilResourcesAvailable = nsNeeded;
if (nsNeeded <= timeoutNs) {
isSuccess = true;
return remaimingPermits; // make reservation.
} else {
return prev;
}
}
}
public long getNsUntilResourcesAvailable() {
return nsUntilResourcesAvailable;
}
@Override
public String toString() {
return "ReservationHandler{" + "deadlineNanos=" + deadlineNanos + ", permits=" + permits
+ ", nsUntilResourcesAvailable=" + nsUntilResourcesAvailable + '}';
}
@Override
public boolean isSuccess() {
return isSuccess;
}
@Override
public long permitAvailableEstimateInNanos() {
return nsUntilResourcesAvailable;
}
}
public long getNrPermits() {
return permits.get();
}
@Override
@SuppressFBWarnings("MDM_THREAD_YIELD") //fb has a point here...
public boolean tryAcquire(final int nrPermits, final long deadlineNanos) throws InterruptedException {
Acquisition acq = tryAcquireGetDelayNanos(nrPermits, deadlineNanos);
if (acq.isSuccess()) {
long permitAvailableEstimateInNanos = acq.permitAvailableEstimateInNanos();
if (permitAvailableEstimateInNanos > 0) {
TimeUnit.NANOSECONDS.sleep(permitAvailableEstimateInNanos);
}
return true;
} else {
return false;
}
}
@CheckReturnValue
@Override
public boolean tryAcquire(@Nonnegative final int nrPermits, @Nonnegative final long timeout, final TimeUnit unit)
throws InterruptedException {
if (timeout < 0) {
throw new IllegalArgumentException("incalid timeout " + timeout + ' ' + unit);
}
boolean tryAcquire = tryAcquire(nrPermits);
if (tryAcquire) {
return true;
}
if (timeout == 0) {
return false;
}
Acquisition acq = forceReserve(ExecutionContexts.computeDeadline(timeout, unit), nrPermits);
if (acq.isSuccess()) {
long permitAvailableEstimateInNanos = acq.permitAvailableEstimateInNanos();
if (permitAvailableEstimateInNanos > 0) {
TimeUnit.NANOSECONDS.sleep(permitAvailableEstimateInNanos);
}
return true;
} else {
return false;
}
}
@Override
public Acquisition tryAcquireEx(final int nrPermits, final long timeout, final TimeUnit unit)
throws InterruptedException {
boolean tryAcquire = tryAcquire(nrPermits);
if (tryAcquire) {
return Acquisition.SUCCESS;
}
Acquisition acq = forceReserve(ExecutionContexts.computeDeadline(timeout, unit), nrPermits);
if (acq.isSuccess()) {
long permitAvailableEstimateInNanos = acq.permitAvailableEstimateInNanos();
if (permitAvailableEstimateInNanos > 0) {
TimeUnit.NANOSECONDS.sleep(permitAvailableEstimateInNanos);
}
}
return acq;
}
@Override
public Acquisition tryAcquireEx(final int nrPermits, final long deadlineNanos)
throws InterruptedException {
Acquisition acq = tryAcquireGetDelayNanos(nrPermits, deadlineNanos);
if (acq.isSuccess()) {
long permitAvailableEstimateInNanos = acq.permitAvailableEstimateInNanos();
if (permitAvailableEstimateInNanos > 0) {
TimeUnit.NANOSECONDS.sleep(permitAvailableEstimateInNanos);
}
}
return acq;
}
/**
* @param nrPermits nr of permits to acquire
* @param timeout the maximum time to wait to acquire the permits.
* @param unit the unit of time to wait.
* @return negative value if cannot acquire number of permits within time, or if positive it is the amount of ms
* we can wait to act of the acquired permissions.
* the user of this method needs to be trusted, since it can violate the contract.
* @throws InterruptedException
*/
@Signed
Acquisition tryAcquireGetDelayNanos(final int nrPermits, final long deadlineNanos) {
boolean tryAcquire = tryAcquire(nrPermits);
if (tryAcquire) {
return Acquisition.SUCCESS;
} else {
return forceReserve(deadlineNanos, nrPermits);
}
}
private ReservationHandler forceReserve(final long deadlineNanos, final int nrPermits) {
// no curent permits available, reserve the slots and get the wait time
if (replenisher.isCancelled()) {
throw new IllegalStateException("RateLimiter is closed: " + this);
}
ReservationHandler rh = new ReservationHandler(nanoTimeSupplier.getAsLong(), deadlineNanos);
synchronized (sync) {
Atomics.accumulate(permits, nrPermits, rh, maxBackoffNanos);
}
return rh;
}
@Override
public void close() {
replenisher.cancel(false);
}
public long getPermitsPerReplenishInterval() {
return permitsPerReplenishInterval;
}
public long getPermitReplenishIntervalNanos() {
return permitReplenishIntervalNanos;
}
public long getLastReplenishmentNanos() {
synchronized (sync) {
return lastReplenishmentNanos;
}
}
@Override
public String toString() {
return "RateLimiter{" + "permits=" + permits.get() + ", permitsPerReplenishInterval="
+ permitsPerReplenishInterval + ", permitReplenishIntervalNanos=" + permitReplenishIntervalNanos + '}';
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy