All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.datastax.driver.core.policies.DCAwareRoundRobinPolicy Maven / Gradle / Ivy

There is a newer version: 4.15.102
Show newest version
/*
 * Copyright DataStax, Inc.
 *
 * This software can be used solely with DataStax Enterprise. Please consult the license at
 * http://www.datastax.com/terms/datastax-dse-driver-license-terms
 */
package com.datastax.driver.core.policies;

import com.datastax.driver.core.Cluster;
import com.datastax.driver.core.Configuration;
import com.datastax.driver.core.ConsistencyLevel;
import com.datastax.driver.core.Host;
import com.datastax.driver.core.HostDistance;
import com.datastax.driver.core.Statement;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.base.Joiner;
import com.google.common.base.Preconditions;
import com.google.common.base.Strings;
import com.google.common.collect.AbstractIterator;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.HashSet;
import java.util.Iterator;
import java.util.List;
import java.util.Random;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentMap;
import java.util.concurrent.CopyOnWriteArrayList;
import java.util.concurrent.atomic.AtomicInteger;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

/**
 * A data-center aware Round-robin load balancing policy.
 *
 * 

This policy provides round-robin queries over the node of the local data center. It also * includes in the query plans returned a configurable number of hosts in the remote data centers, * but those are always tried after the local nodes. In other words, this policy guarantees that no * host in a remote data center will be queried unless no host in the local data center can be * reached. * *

If used with a single data center, this policy is equivalent to the {@link RoundRobinPolicy}, * but its DC awareness incurs a slight overhead so the latter should be preferred to this policy in * that case. */ public class DCAwareRoundRobinPolicy implements LoadBalancingPolicy { private static final Logger logger = LoggerFactory.getLogger(DCAwareRoundRobinPolicy.class); /** * Returns a builder to create a new instance. * * @return the builder. */ public static Builder builder() { return new Builder(); } private static final String UNSET = ""; private final ConcurrentMap> perDcLiveHosts = new ConcurrentHashMap>(); private final AtomicInteger index = new AtomicInteger(); @VisibleForTesting volatile String localDc; private final int usedHostsPerRemoteDc; private final boolean dontHopForLocalCL; private boolean contactPointsMultipleDCs = false; private volatile Configuration configuration; private boolean useRemoteHostsForFailover; private DCAwareRoundRobinPolicy( String localDc, int usedHostsPerRemoteDc, boolean allowRemoteDCsForLocalConsistencyLevel, boolean allowEmptyLocalDc) { if (!allowEmptyLocalDc && Strings.isNullOrEmpty(localDc)) throw new IllegalArgumentException("Null or empty data center specified for DC-aware policy"); this.localDc = localDc == null ? UNSET : localDc; this.usedHostsPerRemoteDc = usedHostsPerRemoteDc; this.useRemoteHostsForFailover = allowRemoteDCsForLocalConsistencyLevel; this.dontHopForLocalCL = !allowRemoteDCsForLocalConsistencyLevel; } @Override public void init(Cluster cluster, Collection hosts) { if (localDc != UNSET) logger.info("Using provided data-center name '{}' for DCAwareRoundRobinPolicy", localDc); this.configuration = cluster.getConfiguration(); ArrayList notInLocalDC = new ArrayList(); for (Host host : hosts) { String dc = dc(host); // If the localDC was in "auto-discover" mode and it's the first host for which we have a DC, // use it. if (localDc == UNSET && dc != UNSET) { logger.info( "Using data-center name '{}' for DCAwareRoundRobinPolicy (if this is incorrect, please provide the correct datacenter name with DCAwareRoundRobinPolicy constructor)", dc); localDc = dc; } else if (!dc.equals(localDc)) notInLocalDC.add(String.format("%s (%s)", host.toString(), dc)); CopyOnWriteArrayList prev = perDcLiveHosts.get(dc); if (prev == null) perDcLiveHosts.put(dc, new CopyOnWriteArrayList(Collections.singletonList(host))); else prev.addIfAbsent(host); } if (notInLocalDC.size() > 0) { String nonLocalHosts = Joiner.on(",").join(notInLocalDC); contactPointsMultipleDCs = true; logger.warn( "Some contact points don't match local data center. Local DC = {}. Non-conforming contact points: {}", localDc, nonLocalHosts); } this.index.set(new Random().nextInt(Math.max(hosts.size(), 1))); } private String dc(Host host) { String dc = host.getDatacenter(); return dc == null ? localDc : dc; } @SuppressWarnings("unchecked") private static CopyOnWriteArrayList cloneList(CopyOnWriteArrayList list) { return (CopyOnWriteArrayList) list.clone(); } public boolean isContactPointsMultipleDCs() { return contactPointsMultipleDCs; } public boolean isUseRemoteHostsForFailover() { return useRemoteHostsForFailover; } /** * Return the HostDistance for the provided host. * *

This policy consider nodes in the local datacenter as {@code LOCAL}. For each remote * datacenter, it considers a configurable number of hosts as {@code REMOTE} and the rest is * {@code IGNORED}. * *

To configure how many hosts in each remote datacenter should be considered, see {@link * Builder#withUsedHostsPerRemoteDc(int)}. * * @param host the host of which to return the distance of. * @return the HostDistance to {@code host}. */ @Override public HostDistance distance(Host host) { String dc = dc(host); if (dc == UNSET || dc.equals(localDc)) return HostDistance.LOCAL; CopyOnWriteArrayList dcHosts = perDcLiveHosts.get(dc); if (dcHosts == null || usedHostsPerRemoteDc == 0) return HostDistance.IGNORED; // We need to clone, otherwise our subList call is not thread safe dcHosts = cloneList(dcHosts); return dcHosts.subList(0, Math.min(dcHosts.size(), usedHostsPerRemoteDc)).contains(host) ? HostDistance.REMOTE : HostDistance.IGNORED; } /** * Returns the hosts to use for a new query. * *

The returned plan will always try each known host in the local datacenter first, and then, * if none of the local host is reachable, will try up to a configurable number of other host per * remote datacenter. The order of the local node in the returned query plan will follow a * Round-robin algorithm. * * @param loggedKeyspace the keyspace currently logged in on for this query. * @param statement the query for which to build the plan. * @return a new query plan, i.e. an iterator indicating which host to try first for querying, * which one to use as failover, etc... */ @Override public Iterator newQueryPlan(String loggedKeyspace, final Statement statement) { CopyOnWriteArrayList localLiveHosts = perDcLiveHosts.get(localDc); final List hosts = localLiveHosts == null ? Collections.emptyList() : cloneList(localLiveHosts); final int startIdx = index.getAndIncrement(); return new AbstractIterator() { private int idx = startIdx; private int remainingLocal = hosts.size(); // For remote Dcs private Iterator remoteDcs; private List currentDcHosts; private int currentDcRemaining; @Override protected Host computeNext() { while (true) { if (remainingLocal > 0) { remainingLocal--; int c = idx++ % hosts.size(); if (c < 0) { c += hosts.size(); } return hosts.get(c); } if (currentDcHosts != null && currentDcRemaining > 0) { currentDcRemaining--; int c = idx++ % currentDcHosts.size(); if (c < 0) { c += currentDcHosts.size(); } return currentDcHosts.get(c); } ConsistencyLevel cl = statement.getConsistencyLevel() == null ? configuration.getQueryOptions().getConsistencyLevel() : statement.getConsistencyLevel(); if (dontHopForLocalCL && cl.isDCLocal()) return endOfData(); if (remoteDcs == null) { Set copy = new HashSet(perDcLiveHosts.keySet()); copy.remove(localDc); remoteDcs = copy.iterator(); } if (!remoteDcs.hasNext()) break; String nextRemoteDc = remoteDcs.next(); CopyOnWriteArrayList nextDcHosts = perDcLiveHosts.get(nextRemoteDc); if (nextDcHosts != null) { // Clone for thread safety List dcHosts = cloneList(nextDcHosts); currentDcHosts = dcHosts.subList(0, Math.min(dcHosts.size(), usedHostsPerRemoteDc)); currentDcRemaining = currentDcHosts.size(); } } return endOfData(); } }; } @Override public void onUp(Host host) { String dc = dc(host); // If the localDC was in "auto-discover" mode and it's the first host for which we have a DC, // use it. if (localDc == UNSET && dc != UNSET) { logger.info( "Using data-center name '{}' for DCAwareRoundRobinPolicy (if this is incorrect, please provide the correct datacenter name with DCAwareRoundRobinPolicy constructor)", dc); localDc = dc; } CopyOnWriteArrayList dcHosts = perDcLiveHosts.get(dc); if (dcHosts == null) { CopyOnWriteArrayList newMap = new CopyOnWriteArrayList(Collections.singletonList(host)); dcHosts = perDcLiveHosts.putIfAbsent(dc, newMap); // If we've successfully put our new host, we're good, otherwise we've been beaten so continue if (dcHosts == null) return; } dcHosts.addIfAbsent(host); } @Override public void onDown(Host host) { CopyOnWriteArrayList dcHosts = perDcLiveHosts.get(dc(host)); if (dcHosts != null) dcHosts.remove(host); } @Override public void onAdd(Host host) { onUp(host); } @Override public void onRemove(Host host) { onDown(host); } @Override public void close() { // nothing to do } /** Helper class to build the policy. */ public static class Builder { private String localDc; private int usedHostsPerRemoteDc; private boolean allowRemoteDCsForLocalConsistencyLevel; /** * Sets the name of the datacenter that will be considered "local" by the policy. * *

This must be the name as known by Cassandra (in other words, the name in that appears in * {@code system.peers}, or in the output of admin tools like nodetool). * *

If this method isn't called, the policy will default to the datacenter of the first node * connected to. This will always be ok if all the contact points use at {@code Cluster} * creation are in the local data-center. Otherwise, you should provide the name yourself with * this method. * * @param localDc the name of the datacenter. It should not be {@code null}. * @return this builder. */ public Builder withLocalDc(String localDc) { Preconditions.checkArgument( !Strings.isNullOrEmpty(localDc), "localDc name can't be null or empty. If you want to let the policy autodetect the datacenter, don't call Builder.withLocalDC"); this.localDc = localDc; return this; } /** * Sets the number of hosts per remote datacenter that the policy should consider. * *

The policy's {@code distance()} method will return a {@code HostDistance.REMOTE} distance * for only {@code usedHostsPerRemoteDc} hosts per remote datacenter. Other hosts of the remote * datacenters will be ignored (and thus no connections to them will be maintained). * *

If {@code usedHostsPerRemoteDc > 0}, then if for a query no host in the local datacenter * can be reached and if the consistency level of the query is not {@code LOCAL_ONE} or {@code * LOCAL_QUORUM}, then up to {@code usedHostsPerRemoteDc} hosts per remote datacenter will be * tried by the policy as a fallback. By default, no remote host will be used for {@code * LOCAL_ONE} and {@code LOCAL_QUORUM}, since this would change the meaning of the consistency * level, somewhat breaking the consistency contract (this can be overridden with {@link * #allowRemoteDCsForLocalConsistencyLevel()}). * *

If this method isn't called, the policy will default to 0. * * @param usedHostsPerRemoteDc the number. * @return this builder. * @deprecated This functionality will be removed in the next major release of the driver. DC * failover shouldn't be done in the driver, which does not have the necessary context to * know what makes sense considering application semantics. */ @Deprecated public Builder withUsedHostsPerRemoteDc(int usedHostsPerRemoteDc) { Preconditions.checkArgument( usedHostsPerRemoteDc >= 0, "usedHostsPerRemoteDc must be equal or greater than 0"); this.usedHostsPerRemoteDc = usedHostsPerRemoteDc; return this; } /** * Allows the policy to return remote hosts when building query plans for queries having * consistency level {@code LOCAL_ONE} or {@code LOCAL_QUORUM}. * *

When used in conjunction with {@link #withUsedHostsPerRemoteDc(int) usedHostsPerRemoteDc} * > 0, this overrides the policy of never using remote datacenter nodes for {@code LOCAL_ONE} * and {@code LOCAL_QUORUM} queries. It is however inadvisable to do so in almost all cases, as * this would potentially break consistency guarantees and if you are fine with that, it's * probably better to use a weaker consistency like {@code ONE}, {@code TWO} or {@code THREE}. * As such, this method should generally be avoided; use it only if you know and understand what * you do. * * @return this builder. * @deprecated This functionality will be removed in the next major release of the driver. DC * failover shouldn't be done in the driver, which does not have the necessary context to * know what makes sense considering application semantics. */ @Deprecated public Builder allowRemoteDCsForLocalConsistencyLevel() { this.allowRemoteDCsForLocalConsistencyLevel = true; return this; } /** * Builds the policy configured by this builder. * * @return the policy. */ public DCAwareRoundRobinPolicy build() { if (usedHostsPerRemoteDc == 0 && allowRemoteDCsForLocalConsistencyLevel) { logger.warn( "Setting allowRemoteDCsForLocalConsistencyLevel has no effect if usedHostsPerRemoteDc = 0. " + "This setting will be ignored"); } return new DCAwareRoundRobinPolicy( localDc, usedHostsPerRemoteDc, allowRemoteDCsForLocalConsistencyLevel, true); } } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy