org.apache.flink.runtime.taskmanager.TaskManagerLocation Maven / Gradle / Ivy
The newest version!
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.runtime.taskmanager;
import org.apache.flink.annotation.VisibleForTesting;
import org.apache.flink.configuration.TaskManagerOptionsInternal;
import org.apache.flink.runtime.clusterframework.types.ResourceID;
import org.apache.flink.util.NetUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import javax.annotation.Nonnull;
import java.io.Serializable;
import java.net.InetAddress;
import java.net.UnknownHostException;
import static org.apache.flink.util.Preconditions.checkArgument;
import static org.apache.flink.util.Preconditions.checkNotNull;
/**
* This class encapsulates the connection information of a TaskManager. It describes the host where
* the TaskManager operates and its server port for data exchange. This class also contains
* utilities to work with the TaskManager's host name, which is used to localize work assignments.
*/
public class TaskManagerLocation implements Comparable, java.io.Serializable {
private static final long serialVersionUID = -8254407801276350716L;
private static final Logger LOG = LoggerFactory.getLogger(TaskManagerLocation.class);
// ------------------------------------------------------------------------
/**
* The ID of the resource in which the TaskManager is started. This can be for example the YARN
* container ID or any other unique identifier.
*/
private final ResourceID resourceID;
/** The network address that the TaskManager binds its sockets to. */
private final InetAddress inetAddress;
/** The supplier for fully qualified host name and pure hostname. */
private final HostNameSupplier hostNameSupplier;
/** The port that the TaskManager receive data transport connection requests at. */
private final int dataPort;
/**
* The toString representation, eagerly constructed and cached to avoid repeated string
* building.
*/
private String stringRepresentation;
/**
* ID of the node where the TaskManager is located on. In Yarn and Native Kubernetes mode, this
* value will be set by resource manager when launch this TaskManager(via the config option
* {@link TaskManagerOptionsInternal#TASK_MANAGER_NODE_ID}). In other modes, this value will be
* the external address of the TaskManager.
*/
private final String nodeId;
/**
* Constructs a new instance connection info object. The constructor will attempt to retrieve
* the instance's host name and domain name through the operating system's lookup mechanisms.
*
* @param inetAddress the network address the instance's task manager binds its sockets to
* @param dataPort the port instance's task manager expects to receive transfer envelopes on
* @param hostNameSupplier the supplier for obtaining fully-qualified domain name and pure
* hostname of the task manager
* @param nodeId the ID of node where the task manager is located on.
*/
@VisibleForTesting
public TaskManagerLocation(
ResourceID resourceID,
InetAddress inetAddress,
int dataPort,
HostNameSupplier hostNameSupplier,
String nodeId) {
// -1 indicates a local instance connection info
checkArgument(dataPort > 0 || dataPort == -1, "dataPort must be > 0, or -1 (local)");
this.resourceID = checkNotNull(resourceID);
this.inetAddress = checkNotNull(inetAddress);
this.dataPort = dataPort;
this.hostNameSupplier = checkNotNull(hostNameSupplier);
this.nodeId = checkNotNull(nodeId);
}
/**
* Constructs a new instance connection info object. The constructor will attempt to retrieve
* the instance's host name and domain name through the operating system's lookup mechanisms.
*
* @param inetAddress the network address the instance's task manager binds its sockets to
* @param dataPort the port instance's task manager expects to receive transfer envelopes on
*/
@VisibleForTesting
public TaskManagerLocation(ResourceID resourceID, InetAddress inetAddress, int dataPort) {
this(
resourceID,
inetAddress,
dataPort,
new DefaultHostNameSupplier(inetAddress),
getHostName(inetAddress));
}
public static TaskManagerLocation fromUnresolvedLocation(
final UnresolvedTaskManagerLocation unresolvedLocation,
final ResolutionMode resolutionMode)
throws UnknownHostException {
InetAddress inetAddress = InetAddress.getByName(unresolvedLocation.getExternalAddress());
switch (resolutionMode) {
case RETRIEVE_HOST_NAME:
return new TaskManagerLocation(
unresolvedLocation.getResourceID(),
inetAddress,
unresolvedLocation.getDataPort(),
new DefaultHostNameSupplier(inetAddress),
unresolvedLocation.getNodeId());
case USE_IP_ONLY:
return new TaskManagerLocation(
unresolvedLocation.getResourceID(),
inetAddress,
unresolvedLocation.getDataPort(),
new IpOnlyHostNameSupplier(inetAddress),
unresolvedLocation.getNodeId());
default:
throw new UnsupportedOperationException("Unsupported resolution mode provided.");
}
}
// ------------------------------------------------------------------------
// Getters
// ------------------------------------------------------------------------
/**
* Gets the ID of the resource in which the TaskManager is started. The format of this depends
* on how the TaskManager is started:
*
*
* - If the TaskManager is started via YARN, this is the YARN container ID.
*
- If the TaskManager is started in standalone mode, or via a MiniCluster, this is a
* random ID.
*
- Other deployment modes can set the resource ID in other ways.
*
*
* @return The ID of the resource in which the TaskManager is started
*/
public ResourceID getResourceID() {
return resourceID;
}
/**
* Returns the port instance's task manager expects to receive transfer envelopes on.
*
* @return the port instance's task manager expects to receive transfer envelopes on
*/
public int dataPort() {
return dataPort;
}
/**
* Returns the network address the instance's task manager binds its sockets to.
*
* @return the network address the instance's task manager binds its sockets to
*/
public InetAddress address() {
return inetAddress;
}
/**
* Gets the IP address where the TaskManager operates.
*
* @return The IP address.
*/
public String addressString() {
return inetAddress.toString();
}
/**
* Returns the fully-qualified domain name of the TaskManager provided by {@link
* #hostNameSupplier}.
*
* @return The fully-qualified domain name of the TaskManager.
*/
public String getFQDNHostname() {
return hostNameSupplier.getFqdnHostName();
}
/**
* Gets the hostname of the TaskManager from {@link #hostNameSupplier}.
*
* @return The hostname of the TaskManager.
*/
public String getHostname() {
return hostNameSupplier.getHostName();
}
/**
* Return the ID of node where the task manager is located on.
*
* @return The ID of node where the task manager is located on.
*/
public String getNodeId() {
return nodeId;
}
/**
* Gets the endpoint of the TaskManager in the format of "$HOST:$PORT".
*
* @return The endpoint of the TaskManager.
*/
public String getEndpoint() {
return String.format("%s:%d", getFQDNHostname(), dataPort);
}
// --------------------------------------------------------------------------------------------
// Utilities
// --------------------------------------------------------------------------------------------
/**
* Gets the fully qualified hostname of the TaskManager based on the network address.
*
* @param inetAddress the network address that the TaskManager binds its sockets to
* @return fully qualified hostname of the TaskManager
*/
private static String getFqdnHostName(InetAddress inetAddress) {
String fqdnHostName;
try {
fqdnHostName = inetAddress.getCanonicalHostName();
} catch (Throwable t) {
LOG.warn(
"Unable to determine the canonical hostname. Input split assignment (such as "
+ "for HDFS files) may be non-local when the canonical hostname is missing.");
LOG.debug("getCanonicalHostName() Exception:", t);
fqdnHostName = inetAddress.getHostAddress();
}
return fqdnHostName;
}
/**
* Gets the hostname of the TaskManager based on the network address.
*
* @param inetAddress the network address that the TaskManager binds its sockets to
* @return hostname of the TaskManager
*/
public static String getHostName(InetAddress inetAddress) {
String hostName;
String fqdnHostName = getFqdnHostName(inetAddress);
if (fqdnHostName.equals(inetAddress.getHostAddress())) {
// this happens when the name lookup fails, either due to an exception,
// or because no hostname can be found for the address
// take IP textual representation
hostName = fqdnHostName;
LOG.warn(
"No hostname could be resolved for the IP address {}, using IP address as host name. "
+ "Local input split assignment (such as for HDFS files) may be impacted.",
inetAddress.getHostAddress());
} else {
hostName = NetUtils.getHostnameFromFQDN(fqdnHostName);
}
return hostName;
}
@Override
public String toString() {
if (stringRepresentation == null) {
this.stringRepresentation =
String.format("%s @ %s (dataPort=%d)", resourceID, getFQDNHostname(), dataPort);
}
return stringRepresentation;
}
@Override
public boolean equals(Object obj) {
if (obj == this) {
return true;
} else if (obj != null && obj.getClass() == getClass()) {
TaskManagerLocation that = (TaskManagerLocation) obj;
return this.resourceID.equals(that.resourceID)
&& this.inetAddress.equals(that.inetAddress)
&& this.dataPort == that.dataPort
&& this.nodeId.equals(that.nodeId);
} else {
return false;
}
}
@Override
public int hashCode() {
return resourceID.hashCode()
+ 17 * inetAddress.hashCode()
+ 129 * dataPort
+ 257 * nodeId.hashCode();
}
@Override
public int compareTo(@Nonnull TaskManagerLocation o) {
// decide based on resource ID first
int resourceIdCmp =
this.resourceID.getResourceIdString().compareTo(o.resourceID.getResourceIdString());
if (resourceIdCmp != 0) {
return resourceIdCmp;
}
// decide based on ip address next
byte[] thisAddress = this.inetAddress.getAddress();
byte[] otherAddress = o.inetAddress.getAddress();
if (thisAddress.length < otherAddress.length) {
return -1;
} else if (thisAddress.length > otherAddress.length) {
return 1;
} else {
for (int i = 0; i < thisAddress.length; i++) {
byte tb = thisAddress[i];
byte ob = otherAddress[i];
if (tb < ob) {
return -1;
} else if (tb > ob) {
return 1;
}
}
}
// addresses are identical, decide based on ports.
if (this.dataPort < o.dataPort) {
return -1;
} else if (this.dataPort > o.dataPort) {
return 1;
}
// finally, decided based on node id
return this.nodeId.compareTo(o.nodeId);
}
// --------------------------------------------------------------------------------------------
// Hostname Resolution Suppliers
// --------------------------------------------------------------------------------------------
public interface HostNameSupplier extends Serializable {
String getHostName();
String getFqdnHostName();
}
/**
* This Supplier class could retrieve the FQDN host name of the given InetAddress on demand,
* extract the pure host name and cache the results for later use.
*/
@VisibleForTesting
public static class DefaultHostNameSupplier implements HostNameSupplier {
private final InetAddress inetAddress;
private String hostName;
private String fqdnHostName;
public DefaultHostNameSupplier(InetAddress inetAddress) {
this.inetAddress = inetAddress;
}
/**
* Gets the hostname of the TaskManager. The hostname derives from the fully qualified
* domain name (FQDN, see {@link #getFQDNHostname()}):
*
*
* - If the FQDN is the textual IP address, then the hostname is also the IP address
*
- If the FQDN has only one segment (such as "localhost", or "host17"), then this is
* used as the hostname.
*
- If the FQDN has multiple segments (such as "worker3.subgroup.company.net"), then
* the first segment (here "worker3") will be used as the hostname.
*
*
* @return The hostname of the TaskManager.
*/
@Override
public String getHostName() {
if (hostName == null) {
hostName = TaskManagerLocation.getHostName(inetAddress);
}
return hostName;
}
/**
* Returns the fully-qualified domain name the TaskManager. If the name could not be
* determined, the return value will be a textual representation of the TaskManager's IP
* address.
*
* @return The fully-qualified domain name of the TaskManager.
*/
@Override
public String getFqdnHostName() {
if (fqdnHostName == null) {
fqdnHostName = TaskManagerLocation.getFqdnHostName(inetAddress);
}
return fqdnHostName;
}
}
/**
* This Supplier class returns the IP address of the given InetAddress directly, therefore no
* reverse DNS lookup is required.
*/
@VisibleForTesting
public static class IpOnlyHostNameSupplier implements HostNameSupplier {
private final InetAddress inetAddress;
public IpOnlyHostNameSupplier(InetAddress inetAddress) {
this.inetAddress = inetAddress;
}
/**
* Returns the textual representation of the TaskManager's IP address as host name.
*
* @return The textual representation of the TaskManager's IP address.
*/
@Override
public String getHostName() {
return inetAddress.getHostAddress();
}
/**
* Returns the textual representation of the TaskManager's IP address as FQDN host name.
*
* @return The textual representation of the TaskManager's IP address.
*/
@Override
public String getFqdnHostName() {
return inetAddress.getHostAddress();
}
}
/** The DNS resolution mode for TaskManager's IP address. */
public enum ResolutionMode {
RETRIEVE_HOST_NAME,
USE_IP_ONLY
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy