All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.activemq.artemis.core.server.impl.jdbc.JdbcNodeManager Maven / Gradle / Ivy

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.activemq.artemis.core.server.impl.jdbc;

import java.util.concurrent.ScheduledExecutorService;
import java.util.concurrent.TimeUnit;
import java.util.function.Supplier;

import org.apache.activemq.artemis.api.core.SimpleString;
import org.apache.activemq.artemis.core.config.storage.DatabaseStorageConfiguration;
import org.apache.activemq.artemis.core.server.ActivateCallback;
import org.apache.activemq.artemis.core.server.ActiveMQLockAcquisitionTimeoutException;
import org.apache.activemq.artemis.core.server.ActiveMQServerLogger;
import org.apache.activemq.artemis.core.server.NodeManager;
import org.apache.activemq.artemis.core.server.impl.CleaningActivateCallback;
import org.apache.activemq.artemis.jdbc.store.drivers.JDBCConnectionProvider;
import org.apache.activemq.artemis.jdbc.store.sql.PropertySQLProvider;
import org.apache.activemq.artemis.jdbc.store.sql.SQLProvider;
import org.apache.activemq.artemis.utils.ExecutorFactory;
import org.apache.activemq.artemis.utils.UUID;
import org.apache.activemq.artemis.utils.UUIDGenerator;
import org.jboss.logging.Logger;

import static org.apache.activemq.artemis.core.server.impl.jdbc.LeaseLock.AcquireResult.Timeout;

/**
 * JDBC implementation of {@link NodeManager}.
 */
public final class JdbcNodeManager extends NodeManager {

   private static final Logger LOGGER = Logger.getLogger(JdbcNodeManager.class);
   private static final long MAX_PAUSE_MILLIS = 2000L;

   private final Supplier sharedStateManagerFactory;
   private final Supplier scheduledLiveLockFactory;
   private final Supplier scheduledBackupLockFactory;
   private SharedStateManager sharedStateManager;
   private ScheduledLeaseLock scheduledLiveLock;
   private ScheduledLeaseLock scheduledBackupLock;
   private final long lockAcquisitionTimeoutMillis;
   private volatile boolean interrupted = false;
   private final LeaseLock.Pauser pauser;

   public static JdbcNodeManager with(DatabaseStorageConfiguration configuration,
                                      ScheduledExecutorService scheduledExecutorService,
                                      ExecutorFactory executorFactory) {
      validateTimeoutConfiguration(configuration);
      final SQLProvider.Factory sqlProviderFactory;
      if (configuration.getSqlProviderFactory() != null) {
         sqlProviderFactory = configuration.getSqlProviderFactory();
      } else {
         sqlProviderFactory = new PropertySQLProvider.Factory(configuration.getConnectionProvider());
      }
      final String brokerId = java.util.UUID.randomUUID().toString();
      return usingConnectionProvider(brokerId,
                             configuration.getJdbcLockExpirationMillis(),
                             configuration.getJdbcLockRenewPeriodMillis(),
                             configuration.getJdbcLockAcquisitionTimeoutMillis(),
                             configuration.getConnectionProvider(),
                             sqlProviderFactory.create(configuration.getNodeManagerStoreTableName(), SQLProvider.DatabaseStoreType.NODE_MANAGER),
                             scheduledExecutorService,
                             executorFactory);
   }

   private static JdbcNodeManager usingConnectionProvider(String brokerId,
                                                  long lockExpirationMillis,
                                                  long lockRenewPeriodMillis,
                                                  long lockAcquisitionTimeoutMillis,
                                                  JDBCConnectionProvider connectionProvider,
                                                  SQLProvider provider,
                                                  ScheduledExecutorService scheduledExecutorService,
                                                  ExecutorFactory executorFactory) {
      return new JdbcNodeManager(() -> JdbcSharedStateManager.usingConnectionProvider(brokerId, lockExpirationMillis,
                                                                                      lockRenewPeriodMillis,
                                                                                      connectionProvider,
                                                                                      provider),
         lockExpirationMillis,
         lockRenewPeriodMillis,
         lockAcquisitionTimeoutMillis,
         scheduledExecutorService,
         executorFactory);
   }

   private static void validateTimeoutConfiguration(DatabaseStorageConfiguration configuration) {
      final long lockExpiration = configuration.getJdbcLockExpirationMillis();
      if (lockExpiration <= 0) {
         throw new IllegalArgumentException("jdbc-lock-expiration should be positive");
      }
      final long lockRenewPeriod = configuration.getJdbcLockRenewPeriodMillis();
      if (lockRenewPeriod <= 0) {
         throw new IllegalArgumentException("jdbc-lock-renew-period should be positive");
      }
      if (lockRenewPeriod >= lockExpiration) {
         throw new IllegalArgumentException("jdbc-lock-renew-period should be < jdbc-lock-expiration");
      }
      final int networkTimeout = configuration.getJdbcNetworkTimeout();
      if (networkTimeout >= 0) {
         if (networkTimeout > lockExpiration) {
            LOGGER.warn("jdbc-network-timeout isn't properly configured: the recommended value is <= jdbc-lock-expiration");
         }
      } else {
         LOGGER.warn("jdbc-network-timeout isn't properly configured: the recommended value is <= jdbc-lock-expiration");
      }
   }

   private JdbcNodeManager(Supplier sharedStateManagerFactory,
                           long lockExpirationMillis,
                           long lockRenewPeriodMillis,
                           long lockAcquisitionTimeoutMillis,
                           ScheduledExecutorService scheduledExecutorService,
                           ExecutorFactory executorFactory) {
      super(false);
      this.lockAcquisitionTimeoutMillis = lockAcquisitionTimeoutMillis;
      this.pauser = LeaseLock.Pauser.sleep(Math.min(lockRenewPeriodMillis, MAX_PAUSE_MILLIS), TimeUnit.MILLISECONDS);
      this.sharedStateManagerFactory = sharedStateManagerFactory;
      this.scheduledLiveLockFactory = () -> ScheduledLeaseLock.of(
         scheduledExecutorService,
         executorFactory != null ? executorFactory.getExecutor() : null,
         "live",
         this.sharedStateManager.liveLock(),
         lockRenewPeriodMillis,
         this::notifyLostLock);
      this.scheduledBackupLockFactory = () -> ScheduledLeaseLock.of(
         scheduledExecutorService,
         executorFactory != null ?
            executorFactory.getExecutor() : null,
         "backup",
         this.sharedStateManager.backupLock(),
         lockRenewPeriodMillis,
         this::notifyLostLock);
      this.sharedStateManager = null;
      this.scheduledLiveLock = null;
      this.scheduledBackupLock = null;
   }

   @Override
   protected synchronized void notifyLostLock() {
      try {
         super.notifyLostLock();
      } finally {
         // if any of the notified listener has stopped the node manager or
         // the node manager was already stopped
         if (!isStarted()) {
            return;
         }
         try {
            stop();
         } catch (Exception ex) {
            LOGGER.warn("Stopping node manager has errored on lost lock notification", ex);
         }
      }
   }

   @Override
   public synchronized void start() throws Exception {
      try {
         if (isStarted()) {
            return;
         }
         this.sharedStateManager = sharedStateManagerFactory.get();
         LOGGER.debug("setup sharedStateManager on start");
         final UUID nodeId = sharedStateManager.setup(UUIDGenerator.getInstance()::generateUUID);
         setUUID(nodeId);
         this.scheduledLiveLock = scheduledLiveLockFactory.get();
         this.scheduledBackupLock = scheduledBackupLockFactory.get();
         super.start();
      } catch (IllegalStateException e) {
         this.sharedStateManager = null;
         this.scheduledLiveLock = null;
         this.scheduledBackupLock = null;
         throw e;
      }
   }

   @Override
   public synchronized void stop() throws Exception {
      if (isStarted()) {
         try {
            this.scheduledLiveLock.stop();
            this.scheduledBackupLock.stop();
         } finally {
            super.stop();
            this.sharedStateManager.close();
            this.sharedStateManager = null;
            this.scheduledLiveLock = null;
            this.scheduledBackupLock = null;
         }
      }
   }

   @Override
   protected void finalize() throws Throwable {
      stop();
   }

   @Override
   public boolean isAwaitingFailback() throws NodeManagerException {
      checkStarted();
      LOGGER.debug("ENTER isAwaitingFailback");
      try {
         return readSharedState() == SharedStateManager.State.FAILING_BACK;
      } catch (IllegalStateException e) {
         LOGGER.warn("cannot retrieve the live state: assume it's not yet failed back", e);
         return false;
      } finally {
         LOGGER.debug("EXIT isAwaitingFailback");
      }
   }

   @Override
   public boolean isBackupLive() throws NodeManagerException {
      checkStarted();
      LOGGER.debug("ENTER isBackupLive");
      try {
         //is anyone holding the live lock?
         return this.scheduledLiveLock.lock().isHeld();
      } catch (IllegalStateException e) {
         throw new NodeManagerException(e);
      } finally {
         LOGGER.debug("EXIT isBackupLive");
      }
   }

   @Override
   public void interrupt() {
      LOGGER.debug("ENTER interrupted");
      //need to be volatile: must be called concurrently to work as expected
      interrupted = true;
      LOGGER.debug("EXIT interrupted");
   }

   @Override
   public void releaseBackup() throws NodeManagerException {
      checkStarted();
      LOGGER.debug("ENTER releaseBackup");
      try {
         if (this.scheduledBackupLock.isStarted()) {
            LOGGER.debug("scheduledBackupLock is running: stop it and release backup lock");
            this.scheduledBackupLock.stop();
            this.scheduledBackupLock.lock().release();
         } else {
            LOGGER.debug("scheduledBackupLock is not running");
         }
      } catch (IllegalStateException e) {
         throw new NodeManagerException(e);
      } finally {
         LOGGER.debug("EXIT releaseBackup");
      }
   }

   /**
    * Try to acquire a lock
    */
   private void lock(LeaseLock lock) throws ActiveMQLockAcquisitionTimeoutException, InterruptedException {
      final long lockAcquisitionTimeoutNanos = lockAcquisitionTimeoutMillis >= 0 ?
         TimeUnit.MILLISECONDS.toNanos(lockAcquisitionTimeoutMillis) : -1;
      LeaseLock.AcquireResult acquireResult = null;
      final long start = System.nanoTime();
      while (acquireResult == null) {
         checkStarted();
         // measure distance from the timeout
         final long remainingNanos = remainingNanos(start, lockAcquisitionTimeoutNanos);
         if (remainingNanos == 0) {
            acquireResult = Timeout;
            continue;
         }
         final long remainingMillis = remainingNanos > 0 ? TimeUnit.NANOSECONDS.toMillis(remainingNanos) : -1;
         try {
            acquireResult = lock.tryAcquire(remainingMillis, this.pauser, () -> !this.interrupted);
         } catch (IllegalStateException e) {
            LOGGER.warn("Errored while trying to acquire lock", e);
            if (remainingNanos(start, lockAcquisitionTimeoutNanos) == 0) {
               acquireResult = Timeout;
               continue;
            }
            // that's not precise, but it's ok: it can trigger the timeout right after the pause,
            // depending by the pause length. The sole purpose of the pause is to save
            // hammering with requests the DBMS if the connection is down
            this.pauser.idle();
         }
      }
      switch (acquireResult) {
         case Timeout:
            throw new ActiveMQLockAcquisitionTimeoutException("timed out waiting for lock");
         case Exit:
            this.interrupted = false;
            throw new InterruptedException("LeaseLock was interrupted");
         case Done:
            break;
         default:
            throw new AssertionError(acquireResult + " not managed");
      }

   }

   private static long remainingNanos(long start, long timeoutNanos) {
      if (timeoutNanos > 0) {
         final long elapsedNanos = (System.nanoTime() - start);
         if (elapsedNanos < timeoutNanos) {
            return timeoutNanos - elapsedNanos;
         } else {
            return 0;
         }
      } else {
         assert timeoutNanos == -1;
         return -1;
      }
   }

   private void checkInterrupted(Supplier message) throws InterruptedException {
      if (this.interrupted) {
         interrupted = false;
         throw new InterruptedException(message.get());
      }
   }

   private void renewLock(ScheduledLeaseLock lock) {
      boolean lostLock = true;
      IllegalStateException renewEx = null;
      try {
         lostLock = !this.scheduledLiveLock.lock().renew();
      } catch (IllegalStateException e) {
         renewEx = e;
      }
      if (lostLock) {
         notifyLostLock();
         if (renewEx == null) {
            renewEx = new IllegalStateException(lock.lockName() + " lock isn't renewed");
         }
         throw renewEx;
      }
   }

   /**
    * Lock live node and check for a live state, taking care to renew it (if needed) or releasing it otherwise
    */
   private boolean lockLiveAndCheckLiveState() throws ActiveMQLockAcquisitionTimeoutException, InterruptedException {
      try {
         lock(this.scheduledLiveLock.lock());
         //check if the state is live
         while (true) {
            try {
               final SharedStateManager.State stateWhileLocked = readSharedState();
               final long localExpirationTime = this.scheduledLiveLock.lock().localExpirationTime();
               if (System.currentTimeMillis() > localExpirationTime) {
                  // the lock can be assumed to be expired,
                  // so the state isn't worthy to be considered
                  return false;
               }
               if (stateWhileLocked == SharedStateManager.State.LIVE) {
                  // TODO need some tolerance//renew here?
                  return true;
               } else {
                  // state is not live: can (try to) release the lock
                  this.scheduledLiveLock.lock().release();
                  return false;
               }
            } catch (IllegalStateException e) {
               LOGGER.error("error while holding the live node lock and tried to read the shared state or to release the lock", e);
               checkStarted();
               checkInterrupted(() -> "interrupt on error while checking live state");
               pauser.idle();
               final long localExpirationTime = this.scheduledLiveLock.lock().localExpirationTime();
               if (System.currentTimeMillis() > localExpirationTime) {
                  return false;
               }
            }
         }
      } catch (InterruptedException e) {
         throw e;
      }
   }

   @Override
   public void awaitLiveNode() throws NodeManagerException, InterruptedException {
      checkStarted();
      LOGGER.debug("ENTER awaitLiveNode");
      try {
         boolean liveWhileLocked = false;
         while (!liveWhileLocked) {
            //check first without holding any lock
            SharedStateManager.State state = null;
            try {
               state = readSharedState();
            } catch (IllegalStateException e) {
               LOGGER.warn("Errored while reading shared state", e);
            }
            if (state == SharedStateManager.State.LIVE) {
               //verify if the state is live while holding the live node lock too
               liveWhileLocked = lockLiveAndCheckLiveState();
            } else {
               LOGGER.debugf("state while awaiting live node: %s", state);
            }
            if (!liveWhileLocked) {
               checkStarted();
               checkInterrupted(() -> "awaitLiveNode got interrupted!");
               pauser.idle();
            }
         }
         //state is LIVE and live lock is acquired and valid
         LOGGER.debugf("acquired live node lock while state is %s: starting scheduledLiveLock", SharedStateManager.State.LIVE);
         this.scheduledLiveLock.start();
      } catch (InterruptedException e) {
         throw e;
      } catch (ActiveMQLockAcquisitionTimeoutException | IllegalStateException e) {
         throw new NodeManagerException(e);
      } finally {
         LOGGER.debug("EXIT awaitLiveNode");
      }
   }

   @Override
   public void startBackup() throws NodeManagerException, InterruptedException {
      checkStarted();
      LOGGER.debug("ENTER startBackup");
      try {
         ActiveMQServerLogger.LOGGER.waitingToBecomeBackup();
         lock(scheduledBackupLock.lock());
         scheduledBackupLock.start();
         ActiveMQServerLogger.LOGGER.gotBackupLock();
         if (getUUID() == null)
            readNodeId();
      } catch (InterruptedException ie) {
         throw ie;
      } catch (ActiveMQLockAcquisitionTimeoutException | IllegalStateException e) {
         throw new NodeManagerException(e);
      } finally {
         LOGGER.debug("EXIT startBackup");
      }
   }

   @Override
   public ActivateCallback startLiveNode() throws NodeManagerException, InterruptedException {
      checkStarted();
      LOGGER.debug("ENTER startLiveNode");
      try {
         boolean done = false;
         while (!done) {
            try {
               setFailingBack();
               done = true;
            } catch (IllegalStateException e) {
               LOGGER.warn("cannot set failing back state, retry", e);
               pauser.idle();
               checkInterrupted(() -> "interrupt while trying to set failing back state");
            }
         }

         final String timeoutMessage = lockAcquisitionTimeoutMillis == -1 ? "indefinitely" : lockAcquisitionTimeoutMillis + " milliseconds";

         ActiveMQServerLogger.LOGGER.waitingToObtainLiveLock(timeoutMessage);

         lock(this.scheduledLiveLock.lock());

         this.scheduledLiveLock.start();

         ActiveMQServerLogger.LOGGER.obtainedLiveLock();

         return new CleaningActivateCallback() {
            @Override
            public void activationComplete() {
               LOGGER.debug("ENTER activationComplete");
               try {
                  //state can be written only if the live renew task is running
                  boolean done = false;
                  while (!done) {
                     try {
                        setLive();
                        done = true;
                     } catch (IllegalStateException e) {
                        LOGGER.warn("Errored while trying to setLive", e);
                        checkStarted();
                        pauser.idle();
                        final long localExpirationTime = scheduledLiveLock.lock().localExpirationTime();
                        // optimistic: is just to set a deadline while retrying
                        if (System.currentTimeMillis() > localExpirationTime) {
                           throw new IllegalStateException("live lock is probably expired: failed to setLive");
                        }
                     }
                  }
               } catch (IllegalStateException e) {
                  ActiveMQServerLogger.LOGGER.warn(e.getMessage(), e);
                  throw new NodeManagerException(e);
               } finally {
                  LOGGER.debug("EXIT activationComplete");
               }
            }
         };
      } catch (InterruptedException ie) {
         throw ie;
      } catch (ActiveMQLockAcquisitionTimeoutException | IllegalStateException e) {
         throw new NodeManagerException(e);
      } finally {
         LOGGER.debug("EXIT startLiveNode");
      }
   }

   @Override
   public void pauseLiveServer() throws NodeManagerException {
      checkStarted();
      LOGGER.debug("ENTER pauseLiveServer");
      try {
         if (scheduledLiveLock.isStarted()) {
            LOGGER.debug("scheduledLiveLock is running: set paused shared state, stop it and release live lock");
            setPaused();
            scheduledLiveLock.stop();
            scheduledLiveLock.lock().release();
         } else {
            LOGGER.debug("scheduledLiveLock is not running: try renew live lock");
            renewLock(scheduledLiveLock);
            LOGGER.debug("live lock renewed: set paused shared state and release live lock");
            setPaused();
            scheduledLiveLock.lock().release();
         }
      } catch (IllegalStateException e) {
         throw new NodeManagerException(e);
      } finally {
         LOGGER.debug("EXIT pauseLiveServer");
      }
   }

   @Override
   public void crashLiveServer() throws NodeManagerException {
      checkStarted();
      LOGGER.debug("ENTER crashLiveServer");
      try {
         if (this.scheduledLiveLock.isStarted()) {
            LOGGER.debug("scheduledLiveLock is running: request stop it and release live lock");
            this.scheduledLiveLock.stop();
            this.scheduledLiveLock.lock().release();
         } else {
            LOGGER.debug("scheduledLiveLock is not running");
         }
      } finally {
         LOGGER.debug("EXIT crashLiveServer");
      }
   }

   @Override
   public void awaitLiveStatus() {
      checkStarted();
      LOGGER.debug("ENTER awaitLiveStatus");
      try {
         SharedStateManager.State state = null;
         while (state != SharedStateManager.State.LIVE) {
            try {
               state = readSharedState();
            } catch (IllegalStateException e) {
               LOGGER.warn("Errored while trying to read shared state", e);
            }
            pauser.idle();
            checkStarted();
         }
      } finally {
         LOGGER.debug("EXIT awaitLiveStatus");
      }
   }

   private void setLive() {
      writeSharedState(SharedStateManager.State.LIVE);
   }

   private void setFailingBack() {
      writeSharedState(SharedStateManager.State.FAILING_BACK);
   }

   private void setPaused() {
      writeSharedState(SharedStateManager.State.PAUSED);
   }

   private void writeSharedState(SharedStateManager.State state) {
      LOGGER.debugf("writeSharedState state = %s", state);
      this.sharedStateManager.writeState(state);
   }

   private SharedStateManager.State readSharedState() {
      final SharedStateManager.State state = this.sharedStateManager.readState();
      LOGGER.debugf("readSharedState state = %s", state);
      return state;
   }

   @Override
   public SimpleString readNodeId() {
      checkStarted();
      final UUID nodeId = this.sharedStateManager.readNodeId();
      LOGGER.debugf("readNodeId nodeId = %s", nodeId);
      setUUID(nodeId);
      return getNodeId();
   }

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy