package com.fasterxml.clustermate.service.cluster;
import java.io.IOException;
import java.net.InetAddress;
import java.util.*;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.fasterxml.storemate.shared.IpAndPort;
import com.fasterxml.clustermate.api.EntryKey;
import com.fasterxml.clustermate.api.KeyRange;
import com.fasterxml.clustermate.api.KeySpace;
import com.fasterxml.clustermate.api.NodeDefinition;
import com.fasterxml.clustermate.service.NodeStateStore;
import com.fasterxml.clustermate.service.ServerUtil;
import com.fasterxml.clustermate.service.SharedServiceStuff;
import com.fasterxml.clustermate.service.Stores;
import com.fasterxml.clustermate.service.cfg.ClusterConfig;
import com.fasterxml.clustermate.service.cfg.KeyRangeAllocationStrategy;
import com.fasterxml.clustermate.service.cfg.NodeConfig;
import com.fasterxml.clustermate.service.cfg.ServiceConfig;
import com.fasterxml.clustermate.service.store.StoredEntry;
/**
* Helper class that initializes cluster state on startup: it combines static
* cluster configuration with locally persisted node state to construct the
* initial cluster view for this server instance.
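*<p>
* A minimal usage sketch (illustrative only: the type parameters {@code MyKey}/{@code MyEntry}
* and the variables {@code stuff}, {@code stores} and {@code listenPort} are assumed to be
* supplied by the surrounding server code, and are not defined by this class):
*<pre>{@code
*   long startTime = stuff.getTimeMaster().currentTimeMillis();
*   ClusterBootstrapper<MyKey, MyEntry> bs =
*       new ClusterBootstrapper<MyKey, MyEntry>(startTime, stuff, stores);
*   ClusterViewByServerImpl<MyKey, MyEntry> cluster = bs.bootstrap(listenPort);
*}</pre>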
*/
public class ClusterBootstrapper<K extends EntryKey, E extends StoredEntry<K>>
{
/* We will delete stale unrecognized entries after 24 hours, to
* keep Node store somewhat clean.
*/
private final static long SECS_IN_24H = 24 * 60 * 60;
private final Logger LOG = LoggerFactory.getLogger(getClass());
protected final SharedServiceStuff _stuff;
protected final ServiceConfig _serviceConfig;
protected final Stores _stores;
/**
* Timestamp we use as "current time": usually system time, but
* may be hard-coded by tests.
*/
protected final long _startTime;
protected final KeySpace _keyspace;
public ClusterBootstrapper(long startTime, SharedServiceStuff stuff, Stores stores)
{
_stuff = stuff;
_serviceConfig = stuff.getServiceConfig();
_stores = stores;
_startTime = startTime;
_keyspace = new KeySpace(_serviceConfig.cluster.clusterKeyspaceSize);
}
/**
* Factory method for constructing the initial cluster view from static
* cluster configuration.
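*<p>
* Bootstrapping proceeds roughly as follows (see the method body): resolve the
* local IP addresses, match them against configured node definitions to find
* the entry for this instance, load previously persisted node states, merge
* configuration with persisted state (creating, updating or expiring entries
* as needed), and finally construct the cluster view.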
*
* @param thisInstancePort Port number this instance is listening to; needed to
* find correct cluster configuration
*/
public ClusterViewByServerImpl<K,E> bootstrap(final int thisInstancePort)
throws IOException
{
// First: need the keyspace definition, to build key ranges
NodeDefinition localDef = null;
// Then need to know IP interface(s) host has, to find "local" entry
Set<InetAddress> localIps = new LinkedHashSet<InetAddress>();
ServerUtil.findLocalIPs(localIps);
LOG.info("Local IPs: {}", localIps.toString());
Map<IpAndPort,NodeDefinition> nodeDefs = new LinkedHashMap<IpAndPort,NodeDefinition>();
for (NodeDefinition node : _readNodeDefs()) {
IpAndPort ip = node.getAddress();
LOG.info("Resolving node definitions for: "+ip.toString());
// Entry for this instance?
// NOTE: this call will resolve IP name to address; blocking call:
InetAddress addr = ip.getIP();
if (localIps.contains(addr) && ip.getPort() == thisInstancePort) {
if (localDef != null) {
throw new IllegalStateException("Ambiguous definition: both "
+localDef.getAddress()+" and "+ip+" refer to this host");
}
localDef = node;
continue;
}
// LOG.info("peer node: {}", node); // remove once in prod?
nodeDefs.put(ip, node);
}
// Error: MUST have local node definition (until more dynamic set up is implemented)
if (localDef == null) {
throw new IllegalStateException("Could not find Cluster node definitions for local instance (port "
+thisInstancePort+")");
}
LOG.info("Node definition used for this host: {}, found {} configured peer nodes",
localDef, nodeDefs.size());
final NodeStateStore nodes = _stores.getNodeStore();
// Next: load state definitions from BDB
List<ActiveNodeState> storedStates = nodes.readAll(_keyspace);
LOG.info("Read {} persisted node entries from local store", storedStates.size());
// First things first: find and update node for local node
ActiveNodeState localAct = _remove(storedStates, localDef.getAddress());
if (localAct == null) { // need to create?
if (!_stuff.isRunningTests()) {
LOG.warn("No persisted entry for local node: will create and store one");
}
localAct = new ActiveNodeState(localDef, _startTime);
} else {
// index may have changed; if so, override
if (localAct.getIndex() != localDef.getIndex()) {
LOG.warn("Node index of current node changed from {} to {} -- may change key range!",
localAct.getIndex(), localDef.getIndex());
localAct = localAct.withIndex(localDef.getIndex());
}
}
// one more thing: force dummy update on restart as well (official startup time too)
localAct = localAct.withLastUpdated(_startTime);
// Either way, need to update persisted version
nodes.upsertEntry(localAct);
// then merge entries; create/delete orphans
Map<IpAndPort,ActiveNodeState> activeState = _mergeStates(nodes,
localAct, nodeDefs, storedStates);
LOG.info("Merged state of {} node entries (including local)", activeState.size());
// We could try to determine stored value; but let's reset on reboot, for now:
long clusterUpdateTime = _stuff.getTimeMaster().currentTimeMillis();
return new ClusterViewByServerImpl<K,E>(_stuff, _stores, _keyspace,
localAct, activeState, clusterUpdateTime);
}
/*
/**********************************************************************
/* Internal methods
/**********************************************************************
*/
protected List<NodeDefinition> _readNodeDefs()
throws IOException
{
ArrayList<NodeDefinition> defs = new ArrayList<NodeDefinition>();
ClusterConfig clusterConfig = _serviceConfig.cluster;
List<NodeConfig> nodes = clusterConfig.clusterNodes;
// And then let's read static definition
KeyRangeAllocationStrategy strategy = clusterConfig.type;
if (strategy == null) {
throw new IllegalStateException("Missing 'type' value for ClusterConfig");
}
final int nodeCount = nodes.size();
if (nodeCount < 1) {
throw new IllegalStateException("Missing node definitions in ClusterConfig");
}
// one twist: for single-node cluster, allow whatever copy count (simplifies configs)
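// Summary of the resolution below: single-node clusters always use 1 copy; a
// copy count above the node count is truncated to the node count for
// SIMPLE_LINEAR but rejected for other strategies; a count below 1 is accepted
// as-is for STATIC, and a negative count with SIMPLE_LINEAR means "as many
// copies as there are nodes"; any other combination is a configuration error.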
final int copies;
if (nodeCount == 1) {
copies = 1;
} else {
int copies0 = clusterConfig.numberOfCopies;
// otherwise verify (NOTE: may need to change for dynamic registration)
if (copies0 > nodeCount) {
// actually, let's simply truncate
if (strategy == KeyRangeAllocationStrategy.SIMPLE_LINEAR) {
copies = nodeCount;
LOG.warn("Number of copies set to "+copies0+": but with "+copies+" nodes need to truncate to that value");
} else {
throw new IllegalStateException("Can not require "+copies0+" copies with "+nodeCount+" nodes");
}
} else if (copies0 < 1) {
// Ok for STATIC, but not for others
if (strategy == KeyRangeAllocationStrategy.STATIC) {
copies = copies0; // fine, whatever
} else if (copies0 < 0 && strategy == KeyRangeAllocationStrategy.SIMPLE_LINEAR) {
copies = nodes.size();
LOG.info("Number of copies set to "+copies0+": taken to mean 'maximum', in this case "+copies);
} else {
throw new IllegalStateException("Missing 'numberOfCopies' setting in ClusterConfig (required with strategy "
+strategy+")");
}
} else {
copies = copies0;
}
}
for (int i = 0, end = nodes.size(); i < end; ++i) {
NodeConfig node = nodes.get(i);
IpAndPort ip = node.ipAndPort;
final int index = (i+1);
if (ip == null) {
throw new IllegalStateException("Missing 'ipAndPort' value for node #"
+index+" (out of "+end+")");
}
// Range definitions depend on strategy; static or somewhat dynamic...
KeyRange range;
switch (strategy) {
case STATIC:
if (node.keyRangeStart == 0 && node.keyRangeLength == 0) {
throw new IllegalStateException("Missing 'keyRangeStart' and/or 'keyRangeLength' for node "
+index+" (out of "+end+"), when using STATIC cluster type");
}
range = _keyspace.range(node.keyRangeStart, node.keyRangeLength);
break;
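// For SIMPLE_LINEAR, ranges are derived from the node's position. (The
// following is an assumption about calcSegment's behavior, not verified here:
// the keyspace is split into nodeCount consecutive segments, and each node's
// range is widened to span 'copies' adjacent segments, so that every key is
// covered by 'copies' nodes.)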
case SIMPLE_LINEAR:
range = _keyspace.calcSegment(i, nodeCount, copies);
// sanity check: no empty segments
if (range.getLength() == 0) {
throw new IllegalStateException("Empty range calculated for node "+index+" (of "+nodeCount
+" nodes), keyspace="+_keyspace+", "+copies+" copies");
}
break;
case DYNAMIC_WITH_APPEND: // not (yet!) supported
default:
throw new IllegalStateException("Unsupported (as-of-yet) cluster type: "+strategy);
}
// we'll use same range for both passive and active ranges, with static
defs.add(new NodeDefinition(ip, index, range, range));
}
return defs;
}
/**
* Helper method that takes both configured node definitions and persisted
* node states, to create active node definitions and update persisted
* state if and as necessary.
*/
protected Map<IpAndPort,ActiveNodeState> _mergeStates(NodeStateStore nodeStore,
ActiveNodeState localState, Map<IpAndPort,NodeDefinition> nodeDefs,
List<ActiveNodeState> storedStates)
{
Map<IpAndPort,ActiveNodeState> result = new LinkedHashMap<IpAndPort,ActiveNodeState>();
// and then we'll go over peer nodes
Map<IpAndPort,NodeDefinition> orphanDefs = new LinkedHashMap<IpAndPort,NodeDefinition>(nodeDefs);
LOG.info("Merging {} configured peer entries with {} persistent entries",
nodeDefs.size(), storedStates.size());
// Iterate over entries that have been persisted:
for (ActiveNodeState state : storedStates) {
IpAndPort key = state.getAddress();
// Then: is there config for that entry? If not, skip or remove:
NodeDefinition def = orphanDefs.remove(key);
if (def == null) {
long staleTimeSecs = (_startTime - state.getLastSyncAttempt()) / 1000L;
if (staleTimeSecs < SECS_IN_24H) {
/* Skipping means that (a) we will leave the entry in the local DB, in case
* it MAY be useful via explicit info via cluster; but
* (b) will NOT include in current active state. Latter is
* useful in gracefully expiring information.
*/
LOG.warn("Unrecognized persisted Node state, key {}: less than 24h old, will skip", key);
continue;
}
// If too old, delete
if (!_stuff.isRunningTests()) {
LOG.warn("Unrecognized persisted Node state, key {}: more than 24h old ({} days), will DELETE",
key, (staleTimeSecs / SECS_IN_24H));
}
nodeStore.deleteEntry(key);
continue;
}
// We have both config and state: merge
state = _updatePersistentState(nodeStore, localState, def, state);
result.put(key, state);
}
LOG.info("Any orphan definitions? (node without persisted state) Found {}", orphanDefs.size());
// And then reverse check: any config entries for which we have no state?
// If we do, need to initialize state
int i = 0;
for (NodeDefinition def : orphanDefs.values()) {
ActiveNodeState state = new ActiveNodeState(def, _startTime);
state = state.withSyncRange(localState);
if (!_stuff.isRunningTests()) {
LOG.warn("Configuration entry without state, key {}: will need to (re)create state (sync range {})",
def.getAddress(), state.getRangeSync());
}
try {
nodeStore.upsertEntry(state);
} catch (Exception e) {
LOG.error("Failed to update node state entry #{}, must skip. Problem ({}): {}",
i, e.getClass().getName(), e.getMessage());
}
result.put(state.getAddress(), state);
++i;
}
return result;
}
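/**
* Helper method for locating the state entry with the given address in the
* given collection: if found, the entry is removed from the collection and
* returned; otherwise null is returned.
*/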
private ActiveNodeState _remove(Collection<ActiveNodeState> nodes, IpAndPort key)
{
Iterator<ActiveNodeState> it = nodes.iterator();
while (it.hasNext()) {
ActiveNodeState curr = it.next();
if (key.equals(curr.getAddress())) {
it.remove();
return curr;
}
}
return null;
}
/**
* Helper method that will figure out how to modify persistent state,
* considering active configuration and persisted state.
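*<p>
* Concretely (per the logic below): the sync range is recomputed as the
* intersection of the local node's total range and the peer's total range.
* If the recomputed range is fully contained in the previously persisted one,
* the existing 'syncedUpTo' timestamp is kept; if it extends beyond the old
* range, 'syncedUpTo' is reset to 0 so the wider range gets synchronized anew.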
*/
protected ActiveNodeState _updatePersistentState(NodeStateStore nodeStore,
ActiveNodeState localNode,
NodeDefinition remoteDef, ActiveNodeState remoteNode)
{
// The main thing is to see if sync range has changed...
final KeyRange oldSyncRange = remoteNode.getRangeSync();
KeyRange newSyncRange = localNode.totalRange().intersection(remoteNode.totalRange());
if (newSyncRange.equals(remoteNode.getRangeSync())) {
LOG.info("Sync range between local and {} unchanged: {}"
,remoteNode.getAddress(), newSyncRange);
} else {
long syncedTo = remoteNode.getSyncedUpTo();
// only need to reset if expanding...
if (oldSyncRange.contains(newSyncRange)) {
LOG.info("Sync range between local and {} changed from {} to {}: but new contained in old, no reset"
, new Object[] { remoteNode.getAddress(), oldSyncRange, newSyncRange});
} else {
LOG.warn("Sync range between local and {} changed from {} to {}; new not completely contained in old, MUST reset"
, new Object[] { remoteNode.getAddress(), oldSyncRange, newSyncRange});
syncedTo = 0L;
}
remoteNode = remoteNode.withSyncRange(newSyncRange, syncedTo);
try {
nodeStore.upsertEntry(remoteNode);
} catch (Exception e) {
LOG.error("Failed to update node state for {}, must skip. Problem ({}): {}",
remoteNode, e.getClass().getName(), e.getMessage());
}
// anything else?
}
return remoteNode;
}
}