All Downloads are FREE. Search and download functionalities are using the official Maven repository.

alluxio.master.PollingMasterInquireClient Maven / Gradle / Ivy

There is a newer version: 313
Show newest version
/*
 * The Alluxio Open Foundation licenses this work under the Apache License, version 2.0
 * (the "License"). You may not use this work except in compliance with the License, which is
 * available at www.apache.org/licenses/LICENSE-2.0
 *
 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
 * either express or implied, as more fully set forth in the License.
 *
 * See the NOTICE file distributed with this work for information regarding copyright ownership.
 */

package alluxio.master;

import static java.util.stream.Collectors.joining;

import alluxio.conf.AlluxioConfiguration;
import alluxio.conf.PropertyKey;
import alluxio.exception.status.AlluxioStatusException;
import alluxio.exception.status.CancelledException;
import alluxio.exception.status.DeadlineExceededException;
import alluxio.exception.status.NotFoundException;
import alluxio.exception.status.UnavailableException;
import alluxio.grpc.GetServiceVersionPRequest;
import alluxio.grpc.GrpcChannel;
import alluxio.grpc.GrpcChannelBuilder;
import alluxio.grpc.GrpcServerAddress;
import alluxio.grpc.ServiceType;
import alluxio.grpc.ServiceVersionClientServiceGrpc;
import alluxio.retry.RetryPolicy;
import alluxio.retry.RetryUtils;
import alluxio.security.user.UserState;
import alluxio.uri.Authority;
import alluxio.uri.MultiMasterAuthority;

import com.google.common.collect.Lists;
import com.google.common.util.concurrent.ThreadFactoryBuilder;
import io.grpc.StatusRuntimeException;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.net.InetSocketAddress;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.Objects;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.ExecutorCompletionService;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.Future;
import java.util.concurrent.TimeUnit;
import java.util.function.Supplier;
import javax.annotation.Nullable;

/**
 * PollingMasterInquireClient finds the address of the primary master by polling a list of master
 * addresses to see if their RPC servers are serving. This works because only primary masters serve
 * RPCs.
 */
public class PollingMasterInquireClient implements MasterInquireClient {
  private static final Logger LOG = LoggerFactory.getLogger(PollingMasterInquireClient.class);
  private static final ExecutorService EXECUTOR_SERVICE =
      Executors.newCachedThreadPool(
          new ThreadFactoryBuilder()
              .setDaemon(true)
              .setNameFormat("pollingMasterThread-%d")
              .build()
      );

  private final MultiMasterConnectDetails mConnectDetails;
  private final Supplier mRetryPolicySupplier;
  private final AlluxioConfiguration mConfiguration;
  private final UserState mUserState;
  private final ServiceType mServiceType;

  /**
   * @param masterAddresses the potential master addresses
   * @param alluxioConf Alluxio configuration
   * @param userState user state
   * @param serviceType service type
   */
  public PollingMasterInquireClient(List masterAddresses,
      AlluxioConfiguration alluxioConf,
      UserState userState, ServiceType serviceType) {
    this(masterAddresses, RetryUtils::defaultClientRetry,
        alluxioConf, userState, serviceType);
  }

  /**
   * @param masterAddresses the potential master addresses
   * @param retryPolicySupplier the retry policy supplier
   * @param alluxioConf Alluxio configuration
   * @param serviceType service type
   */
  public PollingMasterInquireClient(List masterAddresses,
      Supplier retryPolicySupplier,
      AlluxioConfiguration alluxioConf, ServiceType serviceType) {
    this(masterAddresses, retryPolicySupplier, alluxioConf,
        UserState.Factory.create(alluxioConf), serviceType);
  }

  /**
   * @param masterAddresses the potential master addresses
   * @param retryPolicySupplier the retry policy supplier
   * @param alluxioConf Alluxio configuration
   * @param userState user state
   * @param serviceType service type
   */
  public PollingMasterInquireClient(List masterAddresses,
      Supplier retryPolicySupplier,
      AlluxioConfiguration alluxioConf,
      UserState userState, ServiceType serviceType) {
    mConnectDetails = new MultiMasterConnectDetails(masterAddresses);
    mRetryPolicySupplier = retryPolicySupplier;
    mConfiguration = alluxioConf;
    mUserState = userState;
    mServiceType = serviceType;
  }

  @Override
  public InetSocketAddress getPrimaryRpcAddress() throws UnavailableException {
    RetryPolicy retry = mRetryPolicySupplier.get();
    while (retry.attempt()) {
      InetSocketAddress address = getAddress();
      if (address != null) {
        return address;
      }
    }
    throw new UnavailableException(String.format(
        "Failed to determine primary master rpc address after polling each of %s %d times",
        mConnectDetails.getAddresses(), retry.getAttemptCount()));
  }

  @Nullable
  private InetSocketAddress getAddress() {
    // Iterate over the masters and try to connect to each of their RPC ports.
    List addresses;
    if (mConfiguration.getBoolean(PropertyKey.USER_RPC_SHUFFLE_MASTERS_ENABLED)) {
      addresses =
          Lists.newArrayList(mConnectDetails.getAddresses());
      Collections.shuffle(addresses);
    } else {
      addresses = mConnectDetails.getAddresses();
    }

    if (mConfiguration.getBoolean(PropertyKey.USER_MASTER_POLLING_CONCURRENT)) {
      return findActiveAddressConcurrent(addresses);
    } else {
      return findActiveAddress(addresses);
    }
  }

  @Nullable
  private InetSocketAddress findActiveAddressConcurrent(List addresses) {
    List> futures = new ArrayList<>(addresses.size());
    try {
      ExecutorCompletionService completionService =
          new ExecutorCompletionService<>(EXECUTOR_SERVICE);
      for (InetSocketAddress address : addresses) {
        futures.add(completionService.submit(() -> checkActiveAddress(address)));
      }
      for (int i = 0; i < addresses.size(); i++) {
        try {
          Future future = completionService.take();
          InetSocketAddress address = future.get();
          if (address != null) {
            return address;
          }
        } catch (InterruptedException | ExecutionException e) {
          break;
        }
      }
      return null;
    } finally {
      futures.forEach(it -> it.cancel(true));
    }
  }

  @Nullable
  private InetSocketAddress findActiveAddress(List addresses) {
    for (InetSocketAddress address : addresses) {
      try {
        if (checkActiveAddress(address) != null) {
          return address;
        }
      } catch (AlluxioStatusException e) {
        break;
      }
    }
    return null;
  }

  private InetSocketAddress checkActiveAddress(InetSocketAddress address)
      throws AlluxioStatusException {
    try {
      LOG.debug("Checking whether {} is listening for RPCs", address);
      pingMetaService(address);
      LOG.debug("Successfully connected to {}", address);
      return address;
    } catch (UnavailableException e) {
      LOG.debug("Failed to connect to {}", address);
      return null;
    } catch (DeadlineExceededException e) {
      LOG.debug("Timeout while connecting to {}", address);
      return null;
    } catch (CancelledException e) {
      LOG.debug("Cancelled while connecting to {}", address);
      return null;
    } catch (NotFoundException e) {
      // If the gRPC server is enabled but the metadata service isn't enabled,
      // try the next master address.
      LOG.debug("Meta service rpc endpoint not found on {}. {}", address, e);
      return null;
    } catch (AlluxioStatusException e) {
      LOG.error("Error while connecting to {}. {}", address, e);
      // Breaking the loop on non filtered error.
      throw e;
    }
  }

  private void pingMetaService(InetSocketAddress address) throws AlluxioStatusException {
    // disable authentication in the channel since version service does not require authentication
    GrpcChannel channel =
        GrpcChannelBuilder.newBuilder(GrpcServerAddress.create(address), mConfiguration)
            .setSubject(mUserState.getSubject())
            .disableAuthentication().build();
    ServiceVersionClientServiceGrpc.ServiceVersionClientServiceBlockingStub versionClient =
        ServiceVersionClientServiceGrpc.newBlockingStub(channel)
            .withDeadlineAfter(mConfiguration.getMs(PropertyKey.USER_MASTER_POLLING_TIMEOUT),
                TimeUnit.MILLISECONDS);
    try {
      versionClient.getServiceVersion(GetServiceVersionPRequest.newBuilder()
          .setServiceType(mServiceType).build());
    } catch (StatusRuntimeException e) {
      throw AlluxioStatusException.fromThrowable(e);
    } finally {
      channel.shutdown();
    }
  }

  @Override
  public List getMasterRpcAddresses() {
    return mConnectDetails.getAddresses();
  }

  @Override
  public ConnectDetails getConnectDetails() {
    return mConnectDetails;
  }

  /**
   * Details used to connect to the leader Alluxio master when there are multiple potential leaders.
   */
  public static class MultiMasterConnectDetails implements ConnectDetails {
    private final List mAddresses;

    /**
     * @param addresses a list of addresses
     */
    public MultiMasterConnectDetails(List addresses) {
      mAddresses = addresses;
    }

    /**
     * @return the addresses
     */
    public List getAddresses() {
      return mAddresses;
    }

    @Override
    public Authority toAuthority() {
      return new MultiMasterAuthority(mAddresses.stream()
          .map(addr -> addr.getHostString() + ":" + addr.getPort()).collect(joining(",")));
    }

    @Override
    public boolean equals(Object o) {
      if (this == o) {
        return true;
      }
      if (!(o instanceof MultiMasterConnectDetails)) {
        return false;
      }
      MultiMasterConnectDetails that = (MultiMasterConnectDetails) o;
      return mAddresses.equals(that.mAddresses);
    }

    @Override
    public int hashCode() {
      return Objects.hash(mAddresses);
    }

    @Override
    public String toString() {
      return toAuthority().toString();
    }
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy