All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.hubspot.singularity.SingularityLeaderController Maven / Gradle / Ivy

package com.hubspot.singularity;

import java.lang.management.ManagementFactory;
import java.lang.management.RuntimeMXBean;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.concurrent.locks.Lock;
import java.util.concurrent.locks.ReentrantLock;

import javax.inject.Singleton;

import org.apache.curator.framework.recipes.leader.LeaderLatchListener;
import org.apache.mesos.Protos;
import org.apache.mesos.Protos.MasterInfo;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import com.google.common.base.Optional;
import com.google.common.net.HostAndPort;
import com.google.inject.Inject;
import com.google.inject.name.Named;
import com.hubspot.mesos.MesosUtils;
import com.hubspot.singularity.SingularityAbort.AbortReason;
import com.hubspot.singularity.config.SingularityConfiguration;
import com.hubspot.singularity.data.StateManager;
import com.hubspot.singularity.mesos.SingularityMesosScheduler;
import com.hubspot.singularity.sentry.SingularityExceptionNotifier;

import io.dropwizard.lifecycle.Managed;

@Singleton
public class SingularityLeaderController implements Managed, LeaderLatchListener {

  private static final Logger LOG = LoggerFactory.getLogger(SingularityLeaderController.class);

  private final StateManager stateManager;
  private final SingularityDriverManager driverManager;
  private final SingularityAbort abort;
  private final SingularityExceptionNotifier exceptionNotifier;
  private final HostAndPort hostAndPort;
  private final long saveStateEveryMs;
  private final StatePoller statePoller;
  private final SingularityMesosScheduler scheduler;

  private volatile boolean master;


  @Inject
  public SingularityLeaderController(StateManager stateManager, SingularityConfiguration configuration, SingularityDriverManager driverManager, SingularityAbort abort, SingularityExceptionNotifier exceptionNotifier,
      @Named(SingularityMainModule.HTTP_HOST_AND_PORT) HostAndPort hostAndPort, SingularityMesosScheduler scheduler) {
    this.driverManager = driverManager;
    this.stateManager = stateManager;
    this.abort = abort;
    this.exceptionNotifier = exceptionNotifier;

    this.hostAndPort = hostAndPort;
    this.saveStateEveryMs = TimeUnit.SECONDS.toMillis(configuration.getSaveStateEverySeconds());
    this.statePoller = new StatePoller();
    this.scheduler = scheduler;

    this.master = false;

  }

  @Override
  public void start() throws Exception {
    statePoller.start();
  }

  @Override
  public void stop() throws Exception {
    statePoller.finish();
  }

  @Override
  public void isLeader() {
    LOG.info("We are now the leader! Current status {}", driverManager.getCurrentStatus());

    master = true;

    if (driverManager.getCurrentStatus() != Protos.Status.DRIVER_RUNNING) {
      try {
        driverManager.startMesos();
        statePoller.wake();
      } catch (Throwable t) {
        LOG.error("While starting driver", t);
        exceptionNotifier.notify(String.format("Error starting driver (%s)", t.getMessage()), t);
        abort.abort(AbortReason.UNRECOVERABLE_ERROR, Optional.of(t));
      }

      if (driverManager.getCurrentStatus() != Protos.Status.DRIVER_RUNNING) {
        abort.abort(AbortReason.UNRECOVERABLE_ERROR, Optional.absent());
      }
    }
  }

  public boolean isMaster() {
    return master;
  }

  public Optional getMaster() {
    return driverManager.getMaster();
  }

  public Optional getLastOfferTimestamp() {
    return driverManager.getLastOfferTimestamp();
  }

  public Protos.Status getCurrentStatus() {
    return driverManager.getCurrentStatus();
  }

  @Override
  public void notLeader() {
    LOG.info("We are not the leader! Current status {}", driverManager.getCurrentStatus());

    master = false;

    if (driverManager.getCurrentStatus() == Protos.Status.DRIVER_RUNNING) {
      try {
        driverManager.stop();

        statePoller.wake();
      } catch (Throwable t) {
        LOG.error("While stopping driver", t);
        exceptionNotifier.notify(String.format("Error while stopping driver (%s)", t.getMessage()), t);
      } finally {
        abort.abort(AbortReason.LOST_LEADERSHIP, Optional.absent());
      }
    }
  }

  private SingularityHostState getHostState() {
    final boolean master = isMaster();
    final Protos.Status driverStatus = getCurrentStatus();

    final RuntimeMXBean mxBean = ManagementFactory.getRuntimeMXBean();
    final long uptime = mxBean.getUptime();

    final long now = System.currentTimeMillis();
    final Optional lastOfferTimestamp = getLastOfferTimestamp();
    final Optional millisSinceLastOfferTimestamp = lastOfferTimestamp.isPresent() ? Optional.of(now - lastOfferTimestamp.get()) : Optional. absent();

    String mesosMaster = null;
    Optional mesosMasterInfo = getMaster();

    if (mesosMasterInfo.isPresent()) {
      mesosMaster = MesosUtils.getMasterHostAndPort(mesosMasterInfo.get());
    }

    return new SingularityHostState(master, uptime, driverStatus.name(), millisSinceLastOfferTimestamp, hostAndPort.getHostText(), hostAndPort.getHostText(), mesosMaster, scheduler.isConnected());
  }

  // This thread lives inside of this class solely so that we can instantly update the state when the leader latch changes.
  public class StatePoller extends Thread {
    private final AtomicBoolean finished = new AtomicBoolean();
    private Lock lock = new ReentrantLock();
    private volatile boolean interrupted = false;

    StatePoller() {
      super("SingularityStatePoller");
      setDaemon(true);
    }

    public void finish() {
      finished.set(true);
      this.interrupt();
    }

    public void wake() {
      this.interrupted = true;
      if (lock.tryLock()) {
        try {
          this.interrupt();
        }
        finally {
          lock.unlock();
        }
      }
      else {
        LOG.trace("state poller in zk code");
      }
    }

    @Override
    public void run() {
      while (!finished.get()) {

        try {
          lock.lock();
          // save current interrupt state and clear it.
          interrupted |= Thread.interrupted();
          final SingularityHostState state = getHostState();
          LOG.trace("Saving state in ZK: " + state);
          stateManager.save(state);
        } catch (InterruptedException e) {
          LOG.trace("Caught interrupted exception, running the loop");
        } catch (Throwable t) {
          LOG.error("Caught exception while saving state", t);
          exceptionNotifier.notify(String.format("Caught exception while saving state (%s)", t.getMessage()), t);
        }
        finally {
          lock.unlock();
          if (interrupted) {
            Thread.currentThread().interrupt();
          }
        }

        try {
          Thread.sleep(saveStateEveryMs);
        } catch (InterruptedException e) {
          interrupted = false;
          LOG.trace("Interrupted, running the loop");
        }
      }
    }
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy