alluxio.master.PollingMasterInquireClient Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of alluxio-core-common Show documentation
Show all versions of alluxio-core-common Show documentation
Common utilities shared in Alluxio core modules
/*
* The Alluxio Open Foundation licenses this work under the Apache License, version 2.0
* (the "License"). You may not use this work except in compliance with the License, which is
* available at www.apache.org/licenses/LICENSE-2.0
*
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
* either express or implied, as more fully set forth in the License.
*
* See the NOTICE file distributed with this work for information regarding copyright ownership.
*/
package alluxio.master;
import static java.util.stream.Collectors.joining;
import alluxio.conf.AlluxioConfiguration;
import alluxio.conf.PropertyKey;
import alluxio.exception.status.AlluxioStatusException;
import alluxio.exception.status.CancelledException;
import alluxio.exception.status.DeadlineExceededException;
import alluxio.exception.status.NotFoundException;
import alluxio.exception.status.UnavailableException;
import alluxio.grpc.GetServiceVersionPRequest;
import alluxio.grpc.GrpcChannel;
import alluxio.grpc.GrpcChannelBuilder;
import alluxio.grpc.GrpcServerAddress;
import alluxio.grpc.ServiceType;
import alluxio.grpc.ServiceVersionClientServiceGrpc;
import alluxio.retry.RetryPolicy;
import alluxio.retry.RetryUtils;
import alluxio.security.user.UserState;
import alluxio.uri.Authority;
import alluxio.uri.MultiMasterAuthority;
import com.google.common.collect.Lists;
import com.google.common.util.concurrent.ThreadFactoryBuilder;
import io.grpc.StatusRuntimeException;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import java.net.InetSocketAddress;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.Objects;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.ExecutorCompletionService;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.Future;
import java.util.concurrent.TimeUnit;
import java.util.function.Supplier;
import javax.annotation.Nullable;
/**
* PollingMasterInquireClient finds the address of the primary master by polling a list of master
* addresses to see if their RPC servers are serving. This works because only primary masters serve
* RPCs.
*/
public class PollingMasterInquireClient implements MasterInquireClient {
private static final Logger LOG = LoggerFactory.getLogger(PollingMasterInquireClient.class);
private static final ExecutorService EXECUTOR_SERVICE =
Executors.newCachedThreadPool(
new ThreadFactoryBuilder()
.setDaemon(true)
.setNameFormat("pollingMasterThread-%d")
.build()
);
private final MultiMasterConnectDetails mConnectDetails;
private final Supplier mRetryPolicySupplier;
private final AlluxioConfiguration mConfiguration;
private final UserState mUserState;
private final ServiceType mServiceType;
/**
* @param masterAddresses the potential master addresses
* @param alluxioConf Alluxio configuration
* @param userState user state
* @param serviceType service type
*/
public PollingMasterInquireClient(List masterAddresses,
AlluxioConfiguration alluxioConf,
UserState userState, ServiceType serviceType) {
this(masterAddresses, RetryUtils::defaultClientRetry,
alluxioConf, userState, serviceType);
}
/**
* @param masterAddresses the potential master addresses
* @param retryPolicySupplier the retry policy supplier
* @param alluxioConf Alluxio configuration
* @param serviceType service type
*/
public PollingMasterInquireClient(List masterAddresses,
Supplier retryPolicySupplier,
AlluxioConfiguration alluxioConf, ServiceType serviceType) {
this(masterAddresses, retryPolicySupplier, alluxioConf,
UserState.Factory.create(alluxioConf), serviceType);
}
/**
* @param masterAddresses the potential master addresses
* @param retryPolicySupplier the retry policy supplier
* @param alluxioConf Alluxio configuration
* @param userState user state
* @param serviceType service type
*/
public PollingMasterInquireClient(List masterAddresses,
Supplier retryPolicySupplier,
AlluxioConfiguration alluxioConf,
UserState userState, ServiceType serviceType) {
mConnectDetails = new MultiMasterConnectDetails(masterAddresses);
mRetryPolicySupplier = retryPolicySupplier;
mConfiguration = alluxioConf;
mUserState = userState;
mServiceType = serviceType;
}
@Override
public InetSocketAddress getPrimaryRpcAddress() throws UnavailableException {
RetryPolicy retry = mRetryPolicySupplier.get();
while (retry.attempt()) {
InetSocketAddress address = getAddress();
if (address != null) {
return address;
}
}
throw new UnavailableException(String.format(
"Failed to determine primary master rpc address after polling each of %s %d times",
mConnectDetails.getAddresses(), retry.getAttemptCount()));
}
@Nullable
private InetSocketAddress getAddress() {
// Iterate over the masters and try to connect to each of their RPC ports.
List addresses;
if (mConfiguration.getBoolean(PropertyKey.USER_RPC_SHUFFLE_MASTERS_ENABLED)) {
addresses =
Lists.newArrayList(mConnectDetails.getAddresses());
Collections.shuffle(addresses);
} else {
addresses = mConnectDetails.getAddresses();
}
if (mConfiguration.getBoolean(PropertyKey.USER_MASTER_POLLING_CONCURRENT)) {
return findActiveAddressConcurrent(addresses);
} else {
return findActiveAddress(addresses);
}
}
@Nullable
private InetSocketAddress findActiveAddressConcurrent(List addresses) {
List> futures = new ArrayList<>(addresses.size());
try {
ExecutorCompletionService completionService =
new ExecutorCompletionService<>(EXECUTOR_SERVICE);
for (InetSocketAddress address : addresses) {
futures.add(completionService.submit(() -> checkActiveAddress(address)));
}
for (int i = 0; i < addresses.size(); i++) {
try {
Future future = completionService.take();
InetSocketAddress address = future.get();
if (address != null) {
return address;
}
} catch (InterruptedException | ExecutionException e) {
break;
}
}
return null;
} finally {
futures.forEach(it -> it.cancel(true));
}
}
@Nullable
private InetSocketAddress findActiveAddress(List addresses) {
for (InetSocketAddress address : addresses) {
try {
if (checkActiveAddress(address) != null) {
return address;
}
} catch (AlluxioStatusException e) {
break;
}
}
return null;
}
private InetSocketAddress checkActiveAddress(InetSocketAddress address)
throws AlluxioStatusException {
try {
LOG.debug("Checking whether {} is listening for RPCs", address);
pingMetaService(address);
LOG.debug("Successfully connected to {}", address);
return address;
} catch (UnavailableException e) {
LOG.debug("Failed to connect to {}", address);
return null;
} catch (DeadlineExceededException e) {
LOG.debug("Timeout while connecting to {}", address);
return null;
} catch (CancelledException e) {
LOG.debug("Cancelled while connecting to {}", address);
return null;
} catch (NotFoundException e) {
// If the gRPC server is enabled but the metadata service isn't enabled,
// try the next master address.
LOG.debug("Meta service rpc endpoint not found on {}. {}", address, e);
return null;
} catch (AlluxioStatusException e) {
LOG.error("Error while connecting to {}. {}", address, e);
// Breaking the loop on non filtered error.
throw e;
}
}
private void pingMetaService(InetSocketAddress address) throws AlluxioStatusException {
// disable authentication in the channel since version service does not require authentication
GrpcChannel channel =
GrpcChannelBuilder.newBuilder(GrpcServerAddress.create(address), mConfiguration)
.setSubject(mUserState.getSubject())
.disableAuthentication().build();
ServiceVersionClientServiceGrpc.ServiceVersionClientServiceBlockingStub versionClient =
ServiceVersionClientServiceGrpc.newBlockingStub(channel)
.withDeadlineAfter(mConfiguration.getMs(PropertyKey.USER_MASTER_POLLING_TIMEOUT),
TimeUnit.MILLISECONDS);
try {
versionClient.getServiceVersion(GetServiceVersionPRequest.newBuilder()
.setServiceType(mServiceType).build());
} catch (StatusRuntimeException e) {
throw AlluxioStatusException.fromThrowable(e);
} finally {
channel.shutdown();
}
}
@Override
public List getMasterRpcAddresses() {
return mConnectDetails.getAddresses();
}
@Override
public ConnectDetails getConnectDetails() {
return mConnectDetails;
}
/**
* Details used to connect to the leader Alluxio master when there are multiple potential leaders.
*/
public static class MultiMasterConnectDetails implements ConnectDetails {
private final List mAddresses;
/**
* @param addresses a list of addresses
*/
public MultiMasterConnectDetails(List addresses) {
mAddresses = addresses;
}
/**
* @return the addresses
*/
public List getAddresses() {
return mAddresses;
}
@Override
public Authority toAuthority() {
return new MultiMasterAuthority(mAddresses.stream()
.map(addr -> addr.getHostString() + ":" + addr.getPort()).collect(joining(",")));
}
@Override
public boolean equals(Object o) {
if (this == o) {
return true;
}
if (!(o instanceof MultiMasterConnectDetails)) {
return false;
}
MultiMasterConnectDetails that = (MultiMasterConnectDetails) o;
return mAddresses.equals(that.mAddresses);
}
@Override
public int hashCode() {
return Objects.hash(mAddresses);
}
@Override
public String toString() {
return toAuthority().toString();
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy