com.bazaarvoice.emodb.databus.core.Canary Maven / Gradle / Ivy
package com.bazaarvoice.emodb.databus.core;
import com.bazaarvoice.emodb.common.dropwizard.lifecycle.ServiceFailureListener;
import com.bazaarvoice.emodb.common.dropwizard.log.RateLimitedLog;
import com.bazaarvoice.emodb.common.dropwizard.log.RateLimitedLogFactory;
import com.bazaarvoice.emodb.common.dropwizard.metrics.MetricsGroup;
import com.bazaarvoice.emodb.databus.ChannelNames;
import com.bazaarvoice.emodb.databus.api.Databus;
import com.bazaarvoice.emodb.databus.api.Event;
import com.bazaarvoice.emodb.databus.api.PollResult;
import com.bazaarvoice.emodb.sor.condition.Condition;
import com.bazaarvoice.emodb.table.db.ClusterInfo;
import com.codahale.metrics.MetricRegistry;
import com.codahale.metrics.Timer;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.collect.Lists;
import com.google.common.util.concurrent.AbstractScheduledService;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import javax.annotation.Nullable;
import java.time.Duration;
import java.util.Iterator;
import java.util.List;
import java.util.concurrent.ScheduledExecutorService;
import java.util.concurrent.TimeUnit;
import static java.util.Objects.requireNonNull;
/**
* Polls and acks events from all emo tables once every second (approx.)
*
* Databus canary is a single process in the EmoDB cluster.
* Since there's only one subscription - "__system_bus:canary" and all subscriptions are routed to a single Databus server,
* it's reasonable to use leader election between the EmoDB servers so that only one server polls the canary Databus subscription.
*/
public class Canary extends AbstractScheduledService {
private static final Logger _log = LoggerFactory.getLogger(Canary.class);
private static final Duration POLL_INTERVAL = Duration.ofSeconds(1);
private static final Duration CLAIM_TTL = Duration.ofSeconds(30);
private static final int EVENTS_LIMIT = 50;
private final RateLimitedLog _rateLimitedLog;
private final Databus _databus;
private final MetricsGroup _timers;
private final String _timerName;
private final String _subscriptionName;
private final Condition _subscriptionCondition;
private final ScheduledExecutorService _executor;
public Canary(ClusterInfo cluster, Condition subscriberCondition, Databus databus, RateLimitedLogFactory logFactory, MetricRegistry metricRegistry) {
this(cluster, subscriberCondition, databus, logFactory, metricRegistry, null);
}
@VisibleForTesting
Canary(ClusterInfo cluster, Condition subscriberCondition, Databus databus, RateLimitedLogFactory logFactory,
MetricRegistry metricRegistry, @Nullable ScheduledExecutorService executor) {
_databus = requireNonNull(databus, "databus");
_timers = new MetricsGroup(metricRegistry);
requireNonNull(cluster, "cluster");
_subscriptionName = ChannelNames.getMasterCanarySubscription(cluster.getCluster());
_subscriptionCondition = requireNonNull(subscriberCondition, "subscriptionCondition");
_timerName = newTimerName("readEventsByCanaryPoll-" + cluster.getClusterMetric());
_rateLimitedLog = logFactory.from(_log);
_executor = executor;
createCanarySubscription();
ServiceFailureListener.listenTo(this, metricRegistry);
}
private String newTimerName(String name) {
return MetricRegistry.name("bv.emodb.databus", "DatabusCanary", name, "readEvents");
}
private void createCanarySubscription() {
// Except for resetting the ttl, recreating a subscription that already exists has no effect.
// Assume that multiple servers that manage the same subscriptions can each attempt to create
// the subscription at startup. The subscription should last basically forever.
// Note: make sure that we don't ignore any events
_databus.subscribe(_subscriptionName, _subscriptionCondition,
Duration.ofDays(3650), DatabusChannelConfiguration.CANARY_TTL, false);
}
@Override
protected Scheduler scheduler() {
return Scheduler.newFixedDelaySchedule(0, POLL_INTERVAL.toMillis(), TimeUnit.MILLISECONDS);
}
@Override
protected void shutDown() throws Exception {
_timers.close(); // Lost leadership. Stop reporting metrics so we don't conflict with the new leader.
}
@Override
protected ScheduledExecutorService executor() {
// If an explicit executor was provided use it, otherwise create a default executor
return _executor != null ? _executor : super.executor();
}
@Override
protected void runOneIteration() {
try {
//noinspection StatementWithEmptyBody
while (isRunning() && pollAndAckEvents()) {
// Loop w/o sleeping as long as we keep finding events
}
} catch (Throwable t) {
_rateLimitedLog.error(t, "Unexpected canary exception: {}", t);
stopAsync().awaitTerminated(); // Give up leadership temporarily. Maybe another server will have more success.
}
}
private boolean pollAndAckEvents() {
// Poll for events on the canary bus subscription
long startTime = System.nanoTime();
List eventKeys = Lists.newArrayList();
PollResult result = _databus.poll(_subscriptionName, CLAIM_TTL, EVENTS_LIMIT);
// Get the keys for all events polled. This also forces resolution of all events for timing metrics
Iterator events = result.getEventIterator();
while (events.hasNext()) {
eventKeys.add(events.next().getEventKey());
}
long endTime = System.nanoTime();
trackAverageEventDuration(endTime - startTime, eventKeys.size());
// Last chance to check that we are the leader before doing anything that would be bad if we aren't.
if (!isRunning()) {
return false;
}
// Ack these events
if (!eventKeys.isEmpty()) {
_databus.acknowledge(_subscriptionName, eventKeys);
}
return result.hasMoreEvents();
}
private void trackAverageEventDuration(long durationInNs, int numEvents) {
if (numEvents == 0) {
return;
}
long durationPerEvent = (durationInNs + numEvents - 1) / numEvents; // round up
_timers.beginUpdates();
Timer timer = _timers.timer(_timerName, TimeUnit.MILLISECONDS, TimeUnit.MILLISECONDS);
for (int i = 0; i < numEvents; i++) {
timer.update(durationPerEvent, TimeUnit.NANOSECONDS);
}
_timers.endUpdates();
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy