com.datastax.driver.core.Token Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of cassandra-driver-core Show documentation
Show all versions of cassandra-driver-core Show documentation
A driver for Apache Cassandra 1.2+ that works exclusively with the Cassandra Query Language version 3
(CQL3) and Cassandra's binary protocol.
/*
* Copyright (C) 2012-2015 DataStax Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.datastax.driver.core;
import com.datastax.driver.core.utils.Bytes;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.collect.Lists;
import com.google.common.primitives.UnsignedBytes;
import java.math.BigInteger;
import java.nio.ByteBuffer;
import java.security.MessageDigest;
import java.security.NoSuchAlgorithmException;
import java.util.List;
/**
* A token on the Cassandra ring.
*/
public abstract class Token implements Comparable {
/**
* Returns the data type of this token's value.
*
* @return the datatype.
*/
public abstract DataType getType();
/**
* Returns the raw value of this token.
*
* @return the value.
*/
public abstract Object getValue();
/**
* Returns the serialized form of the current token,
* using the appropriate codec depending on the
* partitioner in use and the CQL datatype for
* the token.
*
* @param protocolVersion the protocol version in use.
* @return the serialized form of the current token
*/
public abstract ByteBuffer serialize(ProtocolVersion protocolVersion);
static Token.Factory getFactory(String partitionerName) {
if (partitionerName.endsWith("Murmur3Partitioner"))
return M3PToken.FACTORY;
else if (partitionerName.endsWith("RandomPartitioner"))
return RPToken.FACTORY;
else if (partitionerName.endsWith("OrderedPartitioner"))
return OPPToken.FACTORY;
else
return null;
}
static abstract class Factory {
abstract Token fromString(String tokenStr);
abstract DataType getTokenType();
abstract Token deserialize(ByteBuffer buffer, ProtocolVersion protocolVersion);
/**
* The minimum token is a special value that no key ever hashes to, it's used both as lower and upper bound.
*/
abstract Token minToken();
abstract Token hash(ByteBuffer partitionKey);
abstract List split(Token startToken, Token endToken, int numberOfSplits);
// Base implementation for split
protected List split(BigInteger start, BigInteger range,
BigInteger ringEnd, BigInteger ringLength,
int numberOfSplits) {
BigInteger[] tmp = range.divideAndRemainder(BigInteger.valueOf(numberOfSplits));
BigInteger divider = tmp[0];
int remainder = tmp[1].intValue();
List results = Lists.newArrayListWithExpectedSize(numberOfSplits - 1);
BigInteger current = start;
BigInteger dividerPlusOne = (remainder == 0) ? null // won't be used
: divider.add(BigInteger.ONE);
for (int i = 1; i < numberOfSplits; i++) {
current = current.add(remainder-- > 0 ? dividerPlusOne : divider);
if (ringEnd != null && current.compareTo(ringEnd) > 0)
current = current.subtract(ringLength);
results.add(current);
}
return results;
}
}
// Murmur3Partitioner tokens
static class M3PToken extends Token {
private final long value;
public static final Factory FACTORY = new M3PTokenFactory();
private static class M3PTokenFactory extends Factory {
private static final BigInteger RING_END = BigInteger.valueOf(Long.MAX_VALUE);
private static final BigInteger RING_LENGTH = RING_END.subtract(BigInteger.valueOf(Long.MIN_VALUE));
static final M3PToken MIN_TOKEN = new M3PToken(Long.MIN_VALUE);
static final M3PToken MAX_TOKEN = new M3PToken(Long.MAX_VALUE);
private long getblock(ByteBuffer key, int offset, int index) {
int i_8 = index << 3;
int blockOffset = offset + i_8;
return ((long) key.get(blockOffset + 0) & 0xff) + (((long) key.get(blockOffset + 1) & 0xff) << 8) +
(((long) key.get(blockOffset + 2) & 0xff) << 16) + (((long) key.get(blockOffset + 3) & 0xff) << 24) +
(((long) key.get(blockOffset + 4) & 0xff) << 32) + (((long) key.get(blockOffset + 5) & 0xff) << 40) +
(((long) key.get(blockOffset + 6) & 0xff) << 48) + (((long) key.get(blockOffset + 7) & 0xff) << 56);
}
private long rotl64(long v, int n) {
return ((v << n) | (v >>> (64 - n)));
}
private long fmix(long k) {
k ^= k >>> 33;
k *= 0xff51afd7ed558ccdL;
k ^= k >>> 33;
k *= 0xc4ceb9fe1a85ec53L;
k ^= k >>> 33;
return k;
}
// This is an adapted version of the MurmurHash.hash3_x64_128 from Cassandra used
// for M3P. Compared to that methods, there's a few inlining of arguments and we
// only return the first 64-bits of the result since that's all M3P uses.
@SuppressWarnings("fallthrough")
private long murmur(ByteBuffer data) {
int offset = data.position();
int length = data.remaining();
int nblocks = length >> 4; // Process as 128-bit blocks.
long h1 = 0;
long h2 = 0;
long c1 = 0x87c37b91114253d5L;
long c2 = 0x4cf5ad432745937fL;
//----------
// body
for (int i = 0; i < nblocks; i++) {
long k1 = getblock(data, offset, i * 2 + 0);
long k2 = getblock(data, offset, i * 2 + 1);
k1 *= c1;
k1 = rotl64(k1, 31);
k1 *= c2;
h1 ^= k1;
h1 = rotl64(h1, 27);
h1 += h2;
h1 = h1 * 5 + 0x52dce729;
k2 *= c2;
k2 = rotl64(k2, 33);
k2 *= c1;
h2 ^= k2;
h2 = rotl64(h2, 31);
h2 += h1;
h2 = h2 * 5 + 0x38495ab5;
}
//----------
// tail
// Advance offset to the unprocessed tail of the data.
offset += nblocks * 16;
long k1 = 0;
long k2 = 0;
switch (length & 15) {
case 15:
k2 ^= ((long) data.get(offset + 14)) << 48;
case 14:
k2 ^= ((long) data.get(offset + 13)) << 40;
case 13:
k2 ^= ((long) data.get(offset + 12)) << 32;
case 12:
k2 ^= ((long) data.get(offset + 11)) << 24;
case 11:
k2 ^= ((long) data.get(offset + 10)) << 16;
case 10:
k2 ^= ((long) data.get(offset + 9)) << 8;
case 9:
k2 ^= ((long) data.get(offset + 8)) << 0;
k2 *= c2;
k2 = rotl64(k2, 33);
k2 *= c1;
h2 ^= k2;
case 8:
k1 ^= ((long) data.get(offset + 7)) << 56;
case 7:
k1 ^= ((long) data.get(offset + 6)) << 48;
case 6:
k1 ^= ((long) data.get(offset + 5)) << 40;
case 5:
k1 ^= ((long) data.get(offset + 4)) << 32;
case 4:
k1 ^= ((long) data.get(offset + 3)) << 24;
case 3:
k1 ^= ((long) data.get(offset + 2)) << 16;
case 2:
k1 ^= ((long) data.get(offset + 1)) << 8;
case 1:
k1 ^= ((long) data.get(offset));
k1 *= c1;
k1 = rotl64(k1, 31);
k1 *= c2;
h1 ^= k1;
}
//----------
// finalization
h1 ^= length;
h2 ^= length;
h1 += h2;
h2 += h1;
h1 = fmix(h1);
h2 = fmix(h2);
h1 += h2;
h2 += h1;
return h1;
}
@Override
M3PToken fromString(String tokenStr) {
return new M3PToken(Long.parseLong(tokenStr));
}
@Override
DataType getTokenType() {
return DataType.bigint();
}
@Override
Token deserialize(ByteBuffer buffer, ProtocolVersion protocolVersion) {
return new M3PToken(TypeCodec.bigint().deserialize(buffer, protocolVersion));
}
@Override
Token minToken() {
return MIN_TOKEN;
}
@Override
M3PToken hash(ByteBuffer partitionKey) {
long v = murmur(partitionKey);
return new M3PToken(v == Long.MIN_VALUE ? Long.MAX_VALUE : v);
}
@Override
List split(Token startToken, Token endToken, int numberOfSplits) {
// edge case: ]min, min] means the whole ring
if (startToken.equals(endToken) && startToken.equals(MIN_TOKEN))
endToken = MAX_TOKEN;
BigInteger start = BigInteger.valueOf(((M3PToken) startToken).value);
BigInteger end = BigInteger.valueOf(((M3PToken) endToken).value);
BigInteger range = end.subtract(start);
if (range.compareTo(BigInteger.ZERO) < 0)
range = range.add(RING_LENGTH);
List values = super.split(start, range,
RING_END, RING_LENGTH,
numberOfSplits);
List tokens = Lists.newArrayListWithExpectedSize(values.size());
for (BigInteger value : values)
tokens.add(new M3PToken(value.longValue()));
return tokens;
}
}
private M3PToken(long value) {
this.value = value;
}
@Override
public DataType getType() {
return FACTORY.getTokenType();
}
@Override
public Object getValue() {
return value;
}
@Override
public ByteBuffer serialize(ProtocolVersion protocolVersion) {
return TypeCodec.bigint().serialize(value, protocolVersion);
}
@Override
public int compareTo(Token other) {
assert other instanceof M3PToken;
long otherValue = ((M3PToken) other).value;
return value < otherValue ? -1 : (value == otherValue) ? 0 : 1;
}
@Override
public boolean equals(Object obj) {
if (this == obj)
return true;
if (obj == null || this.getClass() != obj.getClass())
return false;
return value == ((M3PToken) obj).value;
}
@Override
public int hashCode() {
return (int) (value ^ (value >>> 32));
}
@Override
public String toString() {
return Long.toString(value);
}
}
// OPPartitioner tokens
static class OPPToken extends Token {
private final ByteBuffer value;
public static final Factory FACTORY = new OPPTokenFactory();
private static class OPPTokenFactory extends Factory {
private static final BigInteger TWO = BigInteger.valueOf(2);
private static final Token MIN_TOKEN = new OPPToken(ByteBuffer.allocate(0));
@Override
public OPPToken fromString(String tokenStr) {
// This method must be able to parse the contents of system.peers.tokens, which do not have the "0x" prefix.
// On the other hand, OPPToken#toString has the "0x" because it should be usable in a CQL query, and it's
// nice to have fromString and toString symetrical.
// So handle both cases:
if (!tokenStr.startsWith("0x")) {
String prefix = (tokenStr.length() % 2 == 0) ? "0x" : "0x0";
tokenStr = prefix + tokenStr;
}
ByteBuffer value = Bytes.fromHexString(tokenStr);
return new OPPToken(value);
}
@Override
DataType getTokenType() {
return DataType.blob();
}
@Override
Token deserialize(ByteBuffer buffer, ProtocolVersion protocolVersion) {
return new OPPToken(buffer);
}
@Override
Token minToken() {
return MIN_TOKEN;
}
@Override
OPPToken hash(ByteBuffer partitionKey) {
return new OPPToken(partitionKey);
}
@Override
List split(Token startToken, Token endToken, int numberOfSplits) {
int tokenOrder = startToken.compareTo(endToken);
// ]min,min] means the whole ring. However, since there is no "max token" with this partitioner, we can't come up
// with a magic end value that would cover the whole ring
if (tokenOrder == 0 && startToken.equals(MIN_TOKEN))
throw new IllegalArgumentException("Cannot split whole ring with ordered partitioner");
OPPToken oppStartToken = (OPPToken) startToken;
OPPToken oppEndToken = (OPPToken) endToken;
int significantBytes;
BigInteger start, end, range, ringEnd, ringLength;
BigInteger bigNumberOfSplits = BigInteger.valueOf(numberOfSplits);
if (tokenOrder < 0) {
// Since tokens are compared lexicographically, convert to integers using the largest length
// (ex: given 0x0A and 0x0BCD, switch to 0x0A00 and 0x0BCD)
significantBytes = Math.max(oppStartToken.value.capacity(), oppEndToken.value.capacity());
// If the number of splits does not fit in the difference between the two integers, use more bytes
// (ex: cannot fit 4 splits between 0x01 and 0x03, so switch to 0x0100 and 0x0300)
// At most 4 additional bytes will be needed, since numberOfSplits is an integer.
int addedBytes = 0;
while (true) {
start = toBigInteger(oppStartToken.value, significantBytes);
end = toBigInteger(oppEndToken.value, significantBytes);
range = end.subtract(start);
if (addedBytes == 4 || range.compareTo(bigNumberOfSplits) >= 0)
break;
significantBytes += 1;
addedBytes += 1;
}
ringEnd = ringLength = null; // won't be used
} else {
// Same logic except that we wrap around the ring
significantBytes = Math.max(oppStartToken.value.capacity(), oppEndToken.value.capacity());
int addedBytes = 0;
while (true) {
start = toBigInteger(oppStartToken.value, significantBytes);
end = toBigInteger(oppEndToken.value, significantBytes);
ringLength = TWO.pow(significantBytes * 8);
ringEnd = ringLength.subtract(BigInteger.ONE);
range = end.subtract(start).add(ringLength);
if (addedBytes == 4 || range.compareTo(bigNumberOfSplits) >= 0)
break;
significantBytes += 1;
addedBytes += 1;
}
}
List values = super.split(start, range,
ringEnd, ringLength,
numberOfSplits);
List tokens = Lists.newArrayListWithExpectedSize(values.size());
for (BigInteger value : values)
tokens.add(new OPPToken(toBytes(value, significantBytes)));
return tokens;
}
// Convert a token's byte array to a number in order to perform computations.
// This depends on the number of "significant bytes" that we use to normalize all tokens to the same size.
// For example if the token is 0x01 but significantBytes is 2, the result is 8 (0x0100).
private BigInteger toBigInteger(ByteBuffer bb, int significantBytes) {
byte[] bytes = Bytes.getArray(bb);
byte[] target;
if (significantBytes != bytes.length) {
target = new byte[significantBytes];
System.arraycopy(bytes, 0, target, 0, bytes.length);
} else
target = bytes;
return new BigInteger(1, target);
}
// Convert a numeric representation back to a byte array.
// Again, the number of significant bytes matters: if the input value is 1 but significantBytes is 2, the
// expected result is 0x0001 (a simple conversion would produce 0x01).
protected ByteBuffer toBytes(BigInteger value, int significantBytes) {
byte[] rawBytes = value.toByteArray();
byte[] result;
if (rawBytes.length == significantBytes)
result = rawBytes;
else {
result = new byte[significantBytes];
int start, length;
if (rawBytes[0] == 0) { // that's a sign byte, ignore (it can cause rawBytes.length == significantBytes + 1)
start = 1;
length = rawBytes.length - 1;
} else {
start = 0;
length = rawBytes.length;
}
System.arraycopy(rawBytes, start, result, significantBytes - length, length);
}
return ByteBuffer.wrap(result);
}
}
@VisibleForTesting
OPPToken(ByteBuffer value) {
this.value = stripTrailingZeroBytes(value);
}
/**
* @return A new ByteBuffer from the input Buffer with any trailing 0-bytes stripped off.
*/
private static ByteBuffer stripTrailingZeroBytes(ByteBuffer b) {
byte result[] = Bytes.getArray(b);
int zeroIndex = result.length;
for (int i = result.length - 1; i > 0; i--) {
if (result[i] == 0) {
zeroIndex = i;
} else {
break;
}
}
return ByteBuffer.wrap(result, 0, zeroIndex);
}
@Override
public DataType getType() {
return FACTORY.getTokenType();
}
@Override
public Object getValue() {
return value;
}
@Override
public ByteBuffer serialize(ProtocolVersion protocolVersion) {
return TypeCodec.blob().serialize(value, protocolVersion);
}
@Override
public int compareTo(Token other) {
assert other instanceof OPPToken;
return UnsignedBytes.lexicographicalComparator().compare(
Bytes.getArray(value),
Bytes.getArray(((OPPToken) other).value));
}
@Override
public boolean equals(Object obj) {
if (this == obj)
return true;
if (obj == null || this.getClass() != obj.getClass())
return false;
return value.equals(((OPPToken) obj).value);
}
@Override
public int hashCode() {
return value.hashCode();
}
@Override
public String toString() {
return Bytes.toHexString(value);
}
}
// RandomPartitioner tokens
static class RPToken extends Token {
private final BigInteger value;
public static final Factory FACTORY = new RPTokenFactory();
private static class RPTokenFactory extends Factory {
private static final BigInteger MIN_VALUE = BigInteger.ONE.negate();
private static final BigInteger MAX_VALUE = BigInteger.valueOf(2).pow(127);
private static final BigInteger RING_LENGTH = MAX_VALUE.add(BigInteger.ONE);
private static final Token MIN_TOKEN = new RPToken(MIN_VALUE);
private static final Token MAX_TOKEN = new RPToken(MAX_VALUE);
private final MessageDigest prototype;
private final boolean supportsClone;
private RPTokenFactory() {
prototype = createMessageDigest();
boolean supportsClone;
try {
prototype.clone();
supportsClone = true;
} catch (CloneNotSupportedException e) {
supportsClone = false;
}
this.supportsClone = supportsClone;
}
private static MessageDigest createMessageDigest() {
try {
return MessageDigest.getInstance("MD5");
} catch (NoSuchAlgorithmException e) {
throw new RuntimeException("MD5 doesn't seem to be available on this JVM", e);
}
}
private MessageDigest newMessageDigest() {
if (supportsClone) {
try {
return (MessageDigest) prototype.clone();
} catch (CloneNotSupportedException ignored) {
}
}
return createMessageDigest();
}
private BigInteger md5(ByteBuffer data) {
MessageDigest digest = newMessageDigest();
digest.update(data.duplicate());
return new BigInteger(digest.digest()).abs();
}
@Override
RPToken fromString(String tokenStr) {
return new RPToken(new BigInteger(tokenStr));
}
@Override
DataType getTokenType() {
return DataType.varint();
}
@Override
Token deserialize(ByteBuffer buffer, ProtocolVersion protocolVersion) {
return new RPToken(TypeCodec.varint().deserialize(buffer, protocolVersion));
}
@Override
Token minToken() {
return MIN_TOKEN;
}
@Override
RPToken hash(ByteBuffer partitionKey) {
return new RPToken(md5(partitionKey));
}
@Override
List split(Token startToken, Token endToken, int numberOfSplits) {
// edge case: ]min, min] means the whole ring
if (startToken.equals(endToken) && startToken.equals(MIN_TOKEN))
endToken = MAX_TOKEN;
BigInteger start = ((RPToken) startToken).value;
BigInteger end = ((RPToken) endToken).value;
BigInteger range = end.subtract(start);
if (range.compareTo(BigInteger.ZERO) < 0)
range = range.add(RING_LENGTH);
List values = super.split(start, range,
MAX_VALUE, RING_LENGTH,
numberOfSplits);
List tokens = Lists.newArrayListWithExpectedSize(values.size());
for (BigInteger value : values)
tokens.add(new RPToken(value));
return tokens;
}
}
private RPToken(BigInteger value) {
this.value = value;
}
@Override
public DataType getType() {
return FACTORY.getTokenType();
}
@Override
public Object getValue() {
return value;
}
@Override
public ByteBuffer serialize(ProtocolVersion protocolVersion) {
return TypeCodec.varint().serialize(value, protocolVersion);
}
@Override
public int compareTo(Token other) {
assert other instanceof RPToken;
return value.compareTo(((RPToken) other).value);
}
@Override
public boolean equals(Object obj) {
if (this == obj)
return true;
if (obj == null || this.getClass() != obj.getClass())
return false;
return value.equals(((RPToken) obj).value);
}
@Override
public int hashCode() {
return value.hashCode();
}
@Override
public String toString() {
return value.toString();
}
}
}