All Downloads are FREE. Search and download functionalities are using the official Maven repository.

net.sf.hajdbc.state.health.ClusterHealthImpl Maven / Gradle / Ivy

There is a newer version: 3.6.61
Show newest version
package net.sf.hajdbc.state.health;

import java.io.File;
import java.net.InetAddress;
import java.net.NetworkInterface;
import java.net.SocketException;
import java.nio.file.Files;
import java.nio.file.Paths;
import java.util.*;
import java.util.Map.Entry;
import java.util.concurrent.*;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.locks.Lock;
import net.sf.hajdbc.Database;
import net.sf.hajdbc.DatabaseCluster;
import net.sf.hajdbc.DatabaseClusterListener;
import net.sf.hajdbc.distributed.Member;
import net.sf.hajdbc.logging.Level;
import net.sf.hajdbc.state.DatabaseEvent;
import net.sf.hajdbc.state.distributed.DistributedStateManager;
import net.sf.hajdbc.state.distributed.NodeState;
import net.sf.hajdbc.util.FileReader;
import net.sf.hajdbc.util.HaJdbcThreadFactory;
import net.sf.hajdbc.util.StopWatch;
import org.joda.time.DateTime;
import org.joda.time.DateTimeUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

public class ClusterHealthImpl implements Runnable, ClusterHealth, DatabaseClusterListener {

  private final static Logger logger = LoggerFactory.getLogger(ClusterHealthImpl.class);

  public static final int MAX_INACTIVATED = 30;
  /**
   * 默认最大观察者探测失败生效次数
   */
  public static final int MAX_UNOBSERVABLE = 6;

  public static final String HOST_ELECT = "HOST_ELECT";
  public static final long DEFAULT_MAX_ELECT_TIME = 4 * 60 * 1000L;
  public static final String MAX_ELECT_TIME = "MAX_ELECT_TIME";
  public static final String NODE_DOWN_LOCK = "node_down";

  private DistributedStateManager stateManager;
  private final Arbiter arbiter;
  /**
   * 节点是否需要更新token,true:需要,false:不需要
   */
  private final AtomicBoolean nodeUpdated = new AtomicBoolean(false);
  //private volatile boolean unattended = true;
  private final ExecutorService executorService;

  private NodeState state = NodeState.offline;
  private volatile long offsetTime = 0;
  //准备选主
  private volatile boolean readyElect = false;
  private volatile Member host = null;
  private FileWatchDog fileWatchDog;

  private final FileReader maxUnobservableReader = FileReader.of4int("max_unobservable");

  private final HeartBeatCommand beatCommand = new HeartBeatCommand();
  private final NodeHealthCommand healthCommand = new NodeHealthCommand();

  private final UpdateTokenCommand updateTokenCommand = new UpdateTokenCommand();
  private final AtomicInteger dbInActivated = new AtomicInteger();
  private final AtomicInteger unObservable = new AtomicInteger();

  private final ScheduledExecutorService scheduledService = Executors.newScheduledThreadPool(1,
      HaJdbcThreadFactory.c("cluster-health-Thread"));


  public ClusterHealthImpl(DistributedStateManager stateManager) {
    this.stateManager = stateManager;
    this.stateManager.getDatabaseCluster().addListener(this);
    executorService = Executors.newFixedThreadPool(3, HaJdbcThreadFactory.c("cluster-executor-Thread"));
    stateManager.setExtContext(ClusterHealth.class.getName(),this);
    fileWatchDog = new FileWatchDog(new File("/proc/mounts"), MountPathHolder.H);
    arbiter = new Arbiter(stateManager.getDatabaseCluster().getId());
  }

  @Override
  public void start(){
    fileWatchDog.watch();
    String localIp = stateManager.getLocalIp();
    arbiter.setLocalIp(localIp);
    arbiter.setIps(this.stateManager.getDatabaseCluster().getNodes());
    this.run();
    scheduledService.scheduleWithFixedDelay(this,500,500, TimeUnit.MILLISECONDS);
  }



  @Override
  public void stop(){
    scheduledService.shutdown();
  }

  @Override
  public NodeHealth getNodeHealth(){
    NodeHealth health = new NodeHealth();
    health.setState(state);
    health.setLastOnlyHost(arbiter.getLocalTokenStore().isOnlyHost());
    health.setLocal(arbiter.getLocalTokenStore().getToken());
    health.setArbiter(arbiter.getArbiter().getToken());
    Set databases = stateManager.getActiveDatabases();
    health.getActiveDBs().retainAll(databases);
    health.getActiveDBs().addAll(databases);
    return health;
  }

  @Override
  public NodeHealth getNodeHealth(Member member) {
    NodeHealthCommand cmd = new NodeHealthCommand();
    return (NodeHealth) stateManager.execute(cmd,member);
  }


  /**
   * Receive host node heart beat.
   */
  @Override
  public void receiveHeartbeat(long sendTime){
    logger.debug("receive host heart beat.");
    DateTime now = new DateTime();
    long offset = ((sendTime - now.getMillis())/1000)*1000;
    if(offset!=offsetTime) {
      offsetTime = offset;
      DateTimeUtils.setCurrentMillisOffset(offsetTime);
    }

  }


  @Override
  public long getOffsetTime() {
    return offsetTime;
  }

  @Override
  public long getHostTime() {
    DateTime now = new DateTime();
    return now.getMillis();
  }

  @Override
  public boolean canWrite() {
    return state.isCanUpdate();
  }

  @Override
  public NodeState getState() {
    return state;
  }

  @Override
  public boolean isHost(){
    return NodeState.host.equals(state);
  }

  @Override
  public void setState(NodeState state) {
    if(state==null){
      state = NodeState.offline;
    }
    if(!state.equals(this.state)){
      NodeState old  = this.state;
      this.state = state;
      changeState(old,this.state);
    }
  }

  void changeState(NodeState oldState,NodeState newState){
    logger.info("node state from "+oldState+" to "+newState);
    stateManager.getDatabaseCluster().changeState(oldState,newState);
  }

  @Override
  public void incrementToken(){
    nodeUpdated.compareAndSet(false,true);
  }

  @Override
  public void updateToken(long token){
    if(canWrite()){
      arbiter.update(token);
    }
  }

  /**
   * Send heartbeat.
   */
  private void sendHeartbeat(){
    stateManager.executeAll(beatCommand.preSend(),stateManager.getLocal());
    logger.debug("host send heart beat end.");
  }


  private boolean isLostHost(){
    boolean lost = (host == null);
    if(host != null){
      NodeHealth health = this.getNodeHealth(host);
      if(health!=null&&health.getState()!=null&&!NodeState.host.equals(health.getState())){
        lost = true;
      }

    }
    return lost;
  }

  /**
   * Returns can it elect.
   * @return Can it elect.
   */
  private boolean canElect(){
    if(isUp()){
      if(arbiter.isObservable(false)){
        DatabaseCluster cluster = stateManager.getDatabaseCluster();
        Database database = cluster.getLocalDatabase();
        if(cluster.isAlive(database, Level.WARN)) {
          return true;
        }else{
          logger.info("database not active.");
        }
      }
    }else{
      logger.info("nic is down.");
    }
    return false;
  }

  /**
   * start elect host node.
   */
  private synchronized void elect() throws InterruptedException {
    //准备开始选主
    this.readyElect = true;
    Lock lock = stateManager.getDatabaseCluster().getLockManager().onlyLock(HOST_ELECT);
    lock.lockInterruptibly();
    try{
      //如果有别的节点完成选主了的话直接跳过,否者继续选主
      if(readyElect) {
        logger.info("host elect begin.");
        StopWatch stopWatch = StopWatch.createStarted();
        long waitTime = 1;
        long beginElectTime = System.nanoTime();
        Entry host = doElect(beginElectTime);
        while (host == null) {
          host = doElect(beginElectTime);
          if (host == null) {
            logger.info("can not elect host node. try elect again after " + waitTime + "s");
            Thread.sleep(waitTime * 1000);
            if (waitTime < 16) {
              long costTime = TimeUnit.NANOSECONDS.toMillis(System.nanoTime() - beginElectTime);
              //10s内等待时间不延长
              if(costTime>10000) {
                waitTime = waitTime * 2;
              }
            }
          } else {
            break;
          }
        }
        if (host != null) {
          logger.info("host elect:{}. cost time:{}", host.getKey(), stopWatch.toString());

          HostCommand hostCommand = new HostCommand();
          hostCommand.setHost(host.getKey());
          hostCommand.setToken(host.getValue().getLocal());
          this.host(host.getKey(), host.getValue().getLocal());
          stateManager.executeAll(hostCommand, stateManager.getLocal());
        }
        logger.info("host elect end. cost time:{}", stopWatch.toString());
      }
    }catch (Exception e){
      logger.warn("",e);
    }finally {
      lock.unlock();
    }

  }

  private Entry doElect(long beginElectTime) {
    Map all = stateManager.executeAll(healthCommand);

    //delete invalid data.
    remveInvalidReceive(all);
    //毫秒
    long costTime = TimeUnit.NANOSECONDS.toMillis(System.nanoTime() - beginElectTime);
    Entry host = null;
    if(all.size()>=stateManager.getMembers().size()){
      //find host
      host = findNodeByState(all, NodeState.host);
      if(host!=null){
        logger.info("elect host by host state. host={}", host);
      }else{
        //not find host node. find backup node
        host = findNodeByState(all, NodeState.backup);
        if(host!=null){
          logger.info("elect host by backup state. host={}", host);
        }else{
          //8s内不单节点选主
          if(costTime< 8000){
            return null;
          }
          //not find backup node. find by valid local node
          host = findNodeByValidLocal(all);
          if(host!=null){
            logger.info("elect host by valid local. host={}", host);
          }else{
            //not find valid local node. find last only host node
            host = findNodeByLastOnlyHost(all);
            if(host!=null){
              logger.info("elect host by only host. host={}", host);
            }else{
              //not find last only host node. find empty node
              host = findNodeByEmpty(all);
              if(host!=null){
                logger.info("elect host by empty node. host={}", host);
              }else{
                //满足最小节点数
                if(all.size()>=getMinNodeCount()){
                  host = findNodeByToken(all);
                }
                if(host!=null){
                  logger.info("elect any node by ge min node count. host={}", host);
                }else{

                  //选举超时
                  if((costTime > getMaxElectTime())){
                    host = findNodeByToken(all);
                  }
                  if(host!=null){
                    logger.info("elect any node by ge max elect time. host={}", host);
                  }
                }
              }
            }
          }
        }
      }

      if(host!=null){
        logger.info("find host node "+host.getKey()+".");
      }
    }else{
      logger.info("some nodes are not responding.");
    }
    return host;

  }

  @Override
  public long getMaxElectTime() {
    long maxElectTime =  DEFAULT_MAX_ELECT_TIME;
    try {
      maxElectTime = Long.parseLong(System.getProperty(MAX_ELECT_TIME, String.valueOf(DEFAULT_MAX_ELECT_TIME)));
    }catch (NumberFormatException e){
      logger.warn("MAX_ELECT_TIME format is error.", e);
    }
    return maxElectTime;
  }

  private int getMinNodeCount(){
    int count = stateManager.getDatabaseCluster().getNodeCount();
    return count;
  }

  @Override
  public void host(Member host, long token){
    this.host = host;
    if(host!=null){
      if(stateManager.getLocal().equals(host)){
        if(!state.equals(NodeState.host)){
          setState(NodeState.host);
          DatabaseCluster databaseCluster = stateManager.getDatabaseCluster();
          Database database = databaseCluster.getLocalDatabase();
          if(!database.isActive()){
            stateManager.activated(new DatabaseEvent(database));
            databaseCluster.getBalancer().add(database);
            database.setActive(true);
          }
        }
      }else{
        setState(NodeState.ready);
      }
    }else{
      //setState(NodeState.offline);
    }
    //选主结束
    readyElect = false;
  }

  @Override
  public Member getHost() {
    return host;
  }

  private Entry findNodeByToken(Map all) {
    Entry find = null;
    Iterator> iterator = all.entrySet().iterator();
    while(iterator.hasNext()) {
      Entry next = iterator.next();
      NodeHealth health = next.getValue();
      if (health != null) {
        if(find==null||health.getLocal()>find.getValue().getLocal()){
          find = next;
        }
      }
    }
    return find;
  }

  private Entry findNodeByEmpty(Map all) {
    Entry find = null;
    Iterator> iterator = all.entrySet().iterator();
    while(iterator.hasNext()) {
      Entry next = iterator.next();
      NodeHealth health = next.getValue();
      if (health != null && health.isEmpty()) {
        find = next;
        break;
      }
    }
    return find;
  }


  private Entry findNodeByLastOnlyHost(Map all) {
    Entry find = null;
    Iterator> iterator = all.entrySet().iterator();
    while(iterator.hasNext()) {
      Entry next = iterator.next();
      NodeHealth health = next.getValue();
      if (health != null && health.isLastOnlyHost()) {
        if(find==null||health.getLocal()>find.getValue().getLocal()){
          find = next;
        }
      }
    }
    return find;
  }

  private Entry findNodeByValidLocal(Map all) {
    Entry find = null;
    Iterator> iterator = all.entrySet().iterator();
    while(iterator.hasNext()) {
      Entry next = iterator.next();
      NodeHealth health = next.getValue();
      if (health != null && health.isValidLocal()) {
        find = next;
        break;
      }
    }
    return find;
  }

  private Entry findNodeByState(Map all,NodeState state) {
    Entry find = null;
    Iterator> iterator = all.entrySet().iterator();
    while(iterator.hasNext()) {
      Entry next = iterator.next();
      NodeHealth health = next.getValue();
      if (health != null && health.getState().equals(state)) {
        find = next;
        break;
      }
    }
    return find;
  }


  /**
   * 30以上次才认为数据库不是活的
   * @param database
   * @return
   */
  private boolean isActiveLocalDb(Database database){
    boolean active = true;
    if(!database.getDbType().equalsIgnoreCase("h2")) {
      if (database != null && !database.isActive()) {
        dbInActivated.incrementAndGet();
      } else {
        dbInActivated.set(0);
      }
      if (dbInActivated.get() > MAX_INACTIVATED) {
        active = false;
        dbInActivated.set(0);
      }
    }
    return active;
  }


  private int getMaxUnobservable(){
    int maxUnobservable = maxUnobservableReader
        .getData(MAX_UNOBSERVABLE);
    if(maxUnobservable<1){
      maxUnobservable = 1;
    }
    if(maxUnobservable>100){
      maxUnobservable = 100;
    }
    return maxUnobservable;
  }

  private boolean isObservable(){
    boolean observable = true;
    if(!arbiter.isObservable(true)){
      unObservable.incrementAndGet();
    }else{
      if(arbiter.isObservable(false)) {
        unObservable.set(0);
      }
    }
    if(unObservable.get()> getMaxUnobservable()){
      observable = false;
      dbInActivated.set(0);
    }
    return observable;
  }

  /**
   * Does it need to be down.
   * @return Does it need to be down?
   */
  private boolean isNeedDown(){
    boolean up = isUp();
    boolean observable = isObservable();
    Database database = stateManager.getDatabaseCluster().getLocalDatabase();
    boolean active = isActiveLocalDb(database);
    String db = database!=null?database.getId():"";
    if(!up ||!active){
      logger.warn("node need down. up={}, observable={}, db active={} db={}",up,observable,active, db);
      return true;
    }else if(!observable){
      Lock lock = stateManager.getDatabaseCluster().getLockManager().onlyLock(NODE_DOWN_LOCK);
      try {
        lock.lockInterruptibly();
        try {
          Map all = stateManager.executeAll(healthCommand, this.stateManager.getLocal());
          remveInvalidReceive(all);
          if(all.size()>0){
            for (Member member : all.keySet()) {
              NodeState nodeState = all.get(member).getState();
              if(nodeState.isCanUpdate()){
                logger.warn("node need down. observable={} find node {} state:{}", observable, member, nodeState);
                return true;
              }
            }
          }
        } finally {
          lock.unlock();
        }
        logger.warn("observable={}, online node is not find. node can not down.", observable);
      }catch (Exception e){
        //ignore e
      }
    }
    return false;
  }

  private void downNode(){
    setState(NodeState.offline);
  }


  @Override
  public void run() {
    fileWatchDog.watch();
    try {
      if(NodeState.host.equals(state)){
        watchHostNode();
      }else {
        watchNotHostNode();
      }

    }catch (Exception e){
      logger.warn("",e);
    }
  }

  private void watchHostNode() throws InterruptedException {
    if(findOtherHost()){
      if(canElect()){
        elect();
      }
    }else{
      if(isNeedDown()){
        downNode();
      }else
      {
        arbiter.getLocalTokenStore().setOnlyHost((stateManager.getActiveDatabases().size()<2));
        sendHeartbeat();
        executorService.submit(new Runnable() {
          @Override
          public void run() {
            updateNewToken();
          }
        });
      }
    }
  }

  private void watchNotHostNode() throws InterruptedException {
    DatabaseCluster databaseCluster = stateManager.getDatabaseCluster();
    if(NodeState.backup.equals(state)||NodeState.ready.equals(state)){
      arbiter.getLocalTokenStore().setOnlyHost(false);
      if(NodeState.backup.equals(state)){
        if(isNeedDown()) {
          downNode();
        }
      }else{
        if(isActiveNode(databaseCluster)) {
          setState(NodeState.backup);
        }
      }
      if(this.isLostHost()){
        if(canElect()){
          elect();
        }else if(NodeState.backup.equals(state)){
          //自己backup, 主丢失可以正常通信就再次选主
          NodeHealth health = this.getNodeHealth(host);
          if (health != null && !NodeState.host.equals(health.getState())) {
            elect();
          }
        }
      }
    }else{
      if(canElect()){
        elect();
      }
      if(NodeState.offline.equals(state)) {
        Database database = databaseCluster.getLocalDatabase();
        if (database.isActive()) {
          databaseCluster.deactivate(database, stateManager);
        }
        //移除其它的数据库
        if(databaseCluster.getBalancer().size()>0) {
          databaseCluster.getBalancer().clear();
        }
      }
    }
  }

  private boolean isActiveNode(DatabaseCluster databaseCluster) {
    boolean active = false;
    try {
      ServiceLoader load = ServiceLoader.load(NodeActiveChecker.class);
      Iterator iterator = load.iterator();
      while (iterator.hasNext()) {
        active = iterator.next().isActive(databaseCluster);
        if (!active) {
          break;
        }
      }
    }catch (Exception e){
      e.printStackTrace();
      active = false;
    }
    return active;
  }

  private boolean isTrace(){
    return Files.exists(Paths.get("/etc/ha-jdbc/trace/health"));
  }

  private void updateNewToken() {
    if(nodeUpdated.compareAndSet(true, false)) {
      long newToken = arbiter.getLocalTokenStore().getToken() + 1;
      if(isTrace()) {
        logger.info("update newToken=" + newToken);
      }
      updateTokenCommand.setToken(newToken);
      stateManager.executeAll(updateTokenCommand);
    }
  }

  /**
   * find other host or not
   * @return find other host or not
   */
  private boolean findOtherHost() {
    NodeHealthCommand cmd = new NodeHealthCommand();
    Map all = stateManager.executeAll(cmd, stateManager.getLocal());
    if(all.size()>0){
      Iterator iterator = all.values().iterator();
      while(iterator.hasNext()){
        NodeHealth next = (NodeHealth)iterator.next();
        if(next!=null&&next.getState().equals(NodeState.host)){
          return true;
        }
      }
    }
    return false;
  }

  private void remveInvalidReceive(Map all) {
    //delete invalid data.
    removeInvalidReceiveByState(all,null);
  }

  private void removeInvalidReceiveByState(Map all,NodeState state) {
    //delete invalid data.
    Iterator> iterator = all.entrySet().iterator();
    while (iterator.hasNext()) {
      Entry next = iterator.next();
      if (next.getValue() == null||(state!=null&&!state.equals(next.getValue().getState()))) {
        iterator.remove();
      }
    }
  }


  private  boolean isUp(){
    return isUp(stateManager.getLocalIp(), 1);
  }

  private  NetworkInterface getNic(String ip) {
    NetworkInterface nic = null;
    try {
      InetAddress address = InetAddress.getByName(ip);
      nic = NetworkInterface.getByInetAddress(address);
    }catch (Exception ex){
      ex.printStackTrace();
    }
    return nic;
  }

  /**
   *
   * @param ip 对应的IP
   * @param failedTryCount 失败后的尝试次数
   * @return
   */
  private  boolean isUp(String ip, int failedTryCount){
    NetworkInterface nic = getNic(ip);
    if(nic!=null){
      try {
        return nic.isUp();
      } catch (SocketException e) {
        logger.warn("is up fail.", e);
        return true;
      }
    }else{
      logger.info("not find nic for ip {}", ip);
      if(failedTryCount>1) {
        try {
          Thread.sleep(1000);
          return isUp(ip, failedTryCount-1);
        } catch (InterruptedException e) {
          //e.printStackTrace();
          return false;
        }
      }else{
        return false;
      }
    }
  }

  @Override
  public void activated(DatabaseEvent event) {
  }

  @Override
  public void deactivated(DatabaseEvent event) {

  }

  @Override
  public void added(Member member) {
    logger.info("added node:{}", member);
  }

  @Override
  public void removed(Member member) {
    logger.info("removed node:{}", member);
    if(member!=null&&member.equals(host)){
      this.host(null,0);
      logger.info("lost Host:{}", member);

    }
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy