All Downloads are FREE. Search and download functionalities are using the official Maven repository.

alluxio.master.backup.BackupLeaderRole Maven / Gradle / Ivy

The newest version!
/*
 * The Alluxio Open Foundation licenses this work under the Apache License, version 2.0
 * (the "License"). You may not use this work except in compliance with the License, which is
 * available at www.apache.org/licenses/LICENSE-2.0
 *
 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
 * either express or implied, as more fully set forth in the License.
 *
 * See the NOTICE file distributed with this work for information regarding copyright ownership.
 */

package alluxio.master.backup;

import alluxio.AlluxioURI;
import alluxio.collections.ConcurrentHashSet;
import alluxio.conf.Configuration;
import alluxio.conf.PropertyKey;
import alluxio.exception.AlluxioException;
import alluxio.exception.BackupAbortedException;
import alluxio.exception.BackupDelegationException;
import alluxio.exception.BackupException;
import alluxio.grpc.BackupPRequest;
import alluxio.grpc.BackupState;
import alluxio.grpc.BackupStatusPRequest;
import alluxio.grpc.GrpcService;
import alluxio.grpc.ServiceType;
import alluxio.master.CoreMasterContext;
import alluxio.master.StateLockManager;
import alluxio.master.StateLockOptions;
import alluxio.master.transport.GrpcMessagingConnection;
import alluxio.master.transport.GrpcMessagingServiceClientHandler;
import alluxio.resource.LockResource;
import alluxio.security.authentication.ClientContextServerInjector;
import alluxio.util.ConfigurationUtils;
import alluxio.util.network.NetworkAddressUtils;
import alluxio.wire.BackupStatus;

import io.grpc.ServerInterceptors;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.io.IOException;
import java.time.Duration;
import java.time.Instant;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.UUID;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.Future;
import java.util.concurrent.ScheduledFuture;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.locks.Lock;
import java.util.concurrent.locks.ReentrantLock;

/**
 * Implementation of {@link BackupRole} for primary mode.
 */
public class BackupLeaderRole extends AbstractBackupRole {
  private static final Logger LOG = LoggerFactory.getLogger(BackupLeaderRole.class);

  // Timeout after which backup will be abandoned if no heart-beat received.
  private final long mBackupAbandonTimeout;

  /** Metadata state pause lock. */
  private StateLockManager mStateLockManager;

  /** Scheduled future to time-put backups on leader. */
  private ScheduledFuture mTimeoutBackupFuture;
  /** Time at which the last heart-beat was received by leader. */
  private Instant mLastHeartBeat;

  /** Future for local backup task. */
  private Future mLocalBackupFuture;

  /** Used to mark remote connection through which delegated backup is being driven. */
  private GrpcMessagingConnection mRemoteBackupConnection;

  /** Backup-worker connections with the leader. */
  private Set mBackupWorkerConnections = new ConcurrentHashSet<>();

  /** Used to store host names for backup-worker connections. */
  private Map mBackupWorkerHostNames = new ConcurrentHashMap<>();

  /** Used to prevent concurrent scheduling of backups. */
  private Lock mBackupInitiateLock = new ReentrantLock(true);

  /**
   * Creates a new backup leader.
   *
   * @param masterContext the master context
   */
  public BackupLeaderRole(CoreMasterContext masterContext) {
    super(masterContext);
    LOG.info("Creating backup-leader role.");
    // Store state lock manager pausing state change when necessary.
    mStateLockManager = masterContext.getStateLockManager();
    // Read properties.
    mBackupAbandonTimeout = Configuration.getMs(PropertyKey.MASTER_BACKUP_ABANDON_TIMEOUT);
  }

  @Override
  public void close() throws IOException {
    if (mRoleClosed) {
      return;
    }

    LOG.info("Closing backup-leader role.");
    // Close each backup-worker connection.
    List> closeFutures = new ArrayList<>(mBackupWorkerConnections.size());
    for (GrpcMessagingConnection conn : mBackupWorkerConnections) {
      closeFutures.add(conn.close());
    }
    // Wait until all backup-worker connection is done closing.
    try {
      CompletableFuture.allOf(closeFutures.toArray(new CompletableFuture[0])).get();
    } catch (Exception e) {
      LOG.warn("Failed to close {} backup-worker connections. Error: {}", closeFutures.size(), e);
    }
    // Reset existing standby connections.
    mBackupWorkerConnections.clear();
    mBackupWorkerHostNames.clear();
    // Cancel ongoing local backup task.
    if (mLocalBackupFuture != null && !mLocalBackupFuture.isDone()) {
      mLocalBackupFuture.cancel(true);
    }
    // Stopping the base after because closing connection uses the base executor.
    super.close();
  }

  @Override
  public Map getRoleServices() {
    Map services = new HashMap<>();
    services
        .put(ServiceType.META_MASTER_BACKUP_MESSAGING_SERVICE,
            new GrpcService(
                ServerInterceptors.intercept(
                    new GrpcMessagingServiceClientHandler(
                        NetworkAddressUtils.getConnectAddress(
                            NetworkAddressUtils.ServiceType.MASTER_RPC,
                            Configuration.global()),
                        (conn) -> activateWorkerConnection(conn), mGrpcMessagingContext,
                        mExecutorService, mCatalystRequestTimeout),
                    new ClientContextServerInjector())).withCloseable(this));
    return services;
  }

  @Override
  public BackupStatus backup(BackupPRequest request, StateLockOptions stateLockOptions)
      throws AlluxioException {
    // Whether to delegate remote to a standby master.
    boolean delegateBackup;
    // Will be populated with initiated id if no back-up in progress.
    UUID backupId;
    // Initiate new backup status under lock.
    try (LockResource initiateLock = new LockResource(mBackupInitiateLock)) {
      if (mBackupTracker.inProgress()) {
        throw new BackupException("Backup in progress");
      }

      // Whether to attempt to delegate backup to a backup worker.
      delegateBackup = Configuration.getBoolean(PropertyKey.MASTER_BACKUP_DELEGATION_ENABLED)
          && ConfigurationUtils.isHaMode(Configuration.global());
      // Check if backup-delegation is suppressed by back-up client.
      if (delegateBackup && request.getOptions().getBypassDelegation()) {
        LOG.info("Back-up delegation is suppressed by back-up client.");
        delegateBackup = false;
      }
      // Fail, if in HA mode and no masters available to delegate,
      // unless `AllowLeader` flag in the backup request is set.
      if (delegateBackup && mBackupWorkerHostNames.size() == 0) {
        if (request.getOptions().getAllowLeader()) {
          LOG.info("Back-up delegation is deactivated for cluster with no followers.");
          delegateBackup = false;
        } else {
          throw new BackupDelegationException("No master found to delegate backup.");
        }
      }
      // Initialize backup status.
      mBackupTracker.reset();
      mBackupTracker.updateState(BackupState.Initiating);
      mBackupTracker.updateHostname(NetworkAddressUtils.getLocalHostName((int) Configuration
          .global().getMs(PropertyKey.NETWORK_HOST_RESOLUTION_TIMEOUT_MS)));

      // Store backup id to query later for async requests.
      backupId = mBackupTracker.getCurrentStatus().getBackupId();
    }
    // Initiate the backup.
    if (delegateBackup) {
      // Fail the backup if delegation failed.
      if (!scheduleRemoteBackup(backupId, request, stateLockOptions)) {
        LOG.error("Failed to schedule remote backup.");
        AlluxioException err = new BackupDelegationException("Failed to delegate the backup.");
        mBackupTracker.updateError(err);
        // Throw here for failing the backup call.
        throw err;
      }
    } else {
      scheduleLocalBackup(request, stateLockOptions);
    }

    // Return immediately if async is requested.
    if (request.getOptions().getRunAsync()) {
      // Client will always see 'Initiating' state first.
      return new BackupStatus(backupId, BackupState.Initiating);
    }

    // Wait until backup is completed.
    mBackupTracker.waitUntilFinished();
    return mBackupTracker.getStatus(backupId);
  }

  @Override
  public BackupStatus getBackupStatus(BackupStatusPRequest statusPRequest) throws AlluxioException {
    return mBackupTracker.getStatus(UUID.fromString(statusPRequest.getBackupId()));
  }

  /**
   * Prepares new follower connection.
   */
  private void activateWorkerConnection(GrpcMessagingConnection workerConnection) {
    LOG.info("Backup-leader connected with backup-worker: {}", workerConnection);
    // Register handshake message handler.
    workerConnection.handler(BackupHandshakeMessage.class, (message) -> {
      message.setConnection(workerConnection);
      return handleHandshakeMessage(message);
    });
    // Register heartbeat message handler.
    workerConnection.handler(BackupHeartbeatMessage.class, this::handleHeartbeatMessage);
    // Register connection error listener.
    workerConnection.onException((error) -> {
      LOG.warn(String.format("Backup-worker connection failed for %s.", workerConnection), error);
    });
    // Register connection close listener.
    workerConnection.onClose((conn) -> {
      LOG.info("Backup-worker connection closed for {}.", workerConnection);
      // Remove the connection when completed
      mBackupWorkerConnections.remove(conn);
      String backupWorkerHostname = mBackupWorkerHostNames.remove(conn);
      // Fail active backup if it was driven by the closed connection.
      if (mBackupTracker.inProgress() && mRemoteBackupConnection != null
          && mRemoteBackupConnection.equals(conn)) {
        LOG.warn("Abandoning current backup as backup-worker: {} is lost.", backupWorkerHostname);
        mBackupTracker.updateError(new BackupAbortedException("Backup-worker is lost."));
        mRemoteBackupConnection = null;
      }
    });
    // Store follower connection.
    // mBackupWorkerHostNames will be updated by handshake message.
    mBackupWorkerConnections.add(workerConnection);
  }

  /**
   * Schedule backup on this master.
   */
  private void scheduleLocalBackup(BackupPRequest request, StateLockOptions stateLockOptions) {
    LOG.info("Scheduling backup at the backup-leader.");
    mLocalBackupFuture = mExecutorService.submit(() -> {
      try (LockResource stateLockResource = mStateLockManager.lockExclusive(stateLockOptions)) {
        mBackupTracker.updateState(BackupState.Running);
        AlluxioURI backupUri = takeBackup(request, mBackupTracker.getEntryCounter());
        mBackupTracker.updateBackupUri(backupUri);
        mBackupTracker.updateState(BackupState.Completed);
      } catch (Exception e) {
        LOG.error("Local backup failed at the backup-leader.", e);
        mBackupTracker.updateError(
            new BackupException(String.format("Local backup failed: %s", e.getMessage()), e));
      }
    });
  }

  /**
   * Delegates a backup to a worker.
   *
   * After successful delegation, follower will send regular heartbeats to leader for updating the
   * backup status.
   *
   * @return {@code true} if delegation successful
   */
  private boolean scheduleRemoteBackup(UUID backupId, BackupPRequest request,
      StateLockOptions stateLockOptions) {
    // Try to delegate backup to a follower.
    LOG.info("Scheduling backup at remote backup-worker.");
    for (Map.Entry workerEntry
        : mBackupWorkerHostNames.entrySet()) {
      try {
        // Get consistent journal sequences.
        Map journalSequences;
        try (LockResource stateLockResource = mStateLockManager.lockExclusive(stateLockOptions,
            () -> {
              // Suspend journals on current follower for every lock attempt.
              LOG.info("Suspending journals at backup-worker: {}", workerEntry.getValue());
              sendMessageBlocking(workerEntry.getKey(), new BackupSuspendMessage());
            })) {
          journalSequences = mJournalSystem.getCurrentSequenceNumbers();
        }
        // Send backup request along with consistent journal sequences.
        BackupRequestMessage requestMessage =
            new BackupRequestMessage(backupId, request, journalSequences);
        LOG.info("Sending backup request to backup-worker: {}. Request message: {}",
            workerEntry.getValue(), requestMessage);
        sendMessageBlocking(workerEntry.getKey(), requestMessage);
        // Delegation successful.
        mRemoteBackupConnection = workerEntry.getKey();
        // Start abandon timer.
        adjustAbandonTimeout(false);
        LOG.info("Delegated the backup to backup-worker: {}", workerEntry.getValue());
        return true;
      } catch (Exception e) {
        LOG.warn(String.format("Failed to delegate backup to a backup-worker: %s",
            workerEntry.getValue()), e);
      }
    }
    return false;
  }

  /**
   * Handles worker heart-beat message.
   */
  private synchronized CompletableFuture handleHandshakeMessage(
      BackupHandshakeMessage handshakeMsg) {
    LOG.info("Received handshake message:{}", handshakeMsg);
    mBackupWorkerHostNames.put(handshakeMsg.getConnection(),
        handshakeMsg.getBackupWorkerHostname());
    // This future is only used for providing a receipt of message.
    return CompletableFuture.completedFuture(null);
  }

  /**
   * Handles worker heart-beat message.
   */
  private synchronized CompletableFuture handleHeartbeatMessage(
      BackupHeartbeatMessage heartbeatMsg) {
    LOG.info("Received heartbeat message:{}", heartbeatMsg);
    if (heartbeatMsg.getBackupStatus() != null) {
      // Process heart-beat.
      mBackupTracker.update(heartbeatMsg.getBackupStatus());
      // Adjust backup timeout.
      adjustAbandonTimeout(!mBackupTracker.inProgress());
    }
    // This future is only used for providing a receipt of message.
    return CompletableFuture.completedFuture(null);
  }

  /**
   * Used to set timer to abandon backup when not received a heart-beat for it.
   */
  private void adjustAbandonTimeout(boolean backupFinished) {
    // Mark last heart-beat time.
    mLastHeartBeat = Instant.now();
    // Cancel active timer.
    if (mTimeoutBackupFuture != null) {
      mTimeoutBackupFuture.cancel(true);
    }
    // Reschedule if backup is still in progress.
    if (!backupFinished) {
      mTimeoutBackupFuture = mTaskScheduler.schedule(() -> {
        Duration sinceLastHeartbeat = Duration.between(mLastHeartBeat, Instant.now());
        if (sinceLastHeartbeat.toMillis() >= mBackupAbandonTimeout) {
          // Abandon the backup.
          LOG.error("Abandoning the backup after not hearing for {}ms.", mBackupAbandonTimeout);
          mBackupTracker.updateError(new BackupAbortedException("Backup timed out"));
        }
      }, mBackupAbandonTimeout, TimeUnit.MILLISECONDS);
    }
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy