
com.signalcollect.triplerush.util.TripleRushVertexMap.scala Maven / Gradle / Ivy
The newest version!
/*
* @author Philip Stutz
*
* Copyright 2012 University of Zurich
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.signalcollect.triplerush.util
import com.signalcollect.Vertex
import com.signalcollect.interfaces.VertexStore
import com.signalcollect.triplerush.EfficientIndexPattern._
import scala.util.hashing.MurmurHash3._
final object Hashing {
/**
* Inlined Murmur3, equivalent to:
* finalizeHash(mixLast(a, b), 7)
*/
@inline def hash(a: Int, b: Int): Int = {
var k = b
k *= 0xcc9e2d51
k = (k << 15) | (k >>> -15)
k *= 0x1b873593
var h = a ^ k
h ^= 7
h ^= h >>> 16
h *= 0x85ebca6b
h ^= h >>> 13
h *= 0xc2b2ae35
h ^= h >>> 16
h
}
@inline def avalanche(hash: Int): Int = {
var h = hash
h ^= h >>> 16
h *= 0x85ebca6b
h ^= h >>> 13
h *= 0xc2b2ae35
h ^= h >>> 16
h
}
@inline def finalizeHash(h: Int, length: Int): Int = avalanche(h ^ length)
@inline def rotateLeft(i: Int, distance: Int): Int = {
(i << distance) | (i >>> -distance)
}
@inline def mixLast(a: Int, b: Int): Int = {
var k = b
k *= 0xcc9e2d51
k = rotateLeft(k, 15)
k *= 0x1b873593
a ^ k
}
}
// A special adaptation of LongHashMap[Vertex[Long, _, Long, Any]].
// We allow arbitrary types for the vertex id to make
// the usage of the framework simple.
// This unfortunately means that we cannot use the id
// as the key, as these keys might be expensive to
// compare and require more space than an array of Ints.
// As a proxy we use the hashCode of a vertex id as
// the key in this map. In order to handle (rare) collisions,
// we have to do an additional check to verify that the vertex id
// matches indeed (and not just the hash of the vertex id).
final class TripleRushVertexMap(
initialSize: Int = 32768,
rehashFraction: Float = 0.75f) extends VertexStore[Long, Any] {
assert(initialSize > 0)
var maxSize = nextPowerOfTwo(initialSize)
assert(1.0f >= rehashFraction && rehashFraction > 0.1f, "Unreasonable rehash fraction.")
assert(maxSize > 0 && maxSize >= initialSize, "Initial size is too large.")
private[this] var maxElements: Int = (rehashFraction * maxSize).floor.toInt
private[this] var values: Array[Vertex[Long, _, Long, Any]] = new Array[Vertex[Long, _, Long, Any]](maxSize)
private[this] var keys: Array[Long] = new Array[Long](maxSize)
// 0 means empty
private[this] var mask: Int = maxSize - 1
private[this] var nextPositionToProcess: Int = 0
@inline override def size: Long = numberOfElements
@inline def isEmpty: Boolean = numberOfElements == 0
private[this] var numberOfElements: Int = 0
def stream: Stream[Vertex[Long, _, Long, Any]] = {
def remainder(i: Int, elementsProcessed: Int): Stream[Vertex[Long, _, Long, Any]] = {
if (elementsProcessed == numberOfElements) {
Stream.empty
} else {
var index = i
var vertex = values(index)
while (vertex == null) {
index += 1
vertex = values(index)
}
Stream.cons(vertex, remainder(index + 1, elementsProcessed + 1))
}
}
remainder(0, 0)
}
def close(): Unit = Unit
def updateStateOfVertex(vertex: Vertex[Long, _, Long, Any]): Unit = Unit
def clear(): Unit = {
values = new Array[Vertex[Long, _, Long, Any]](maxSize)
keys = new Array[Long](maxSize)
numberOfElements = 0
nextPositionToProcess = 0
}
def foreach(f: Vertex[Long, _, Long, Any] => Unit): Unit = {
var i = 0
var elementsProcessed = 0
while (elementsProcessed < numberOfElements) {
val vertex = values(i)
if (vertex != null) {
f(vertex)
elementsProcessed += 1
}
i += 1
}
}
// Removes the vertices after they have been processed.
def process(p: Vertex[Long, _, Long, Any] => Unit, numberOfVertices: Option[Int] = None): Int = {
val limit = math.min(numberOfElements, numberOfVertices.getOrElse(numberOfElements))
var elementsProcessed = 0
while (elementsProcessed < limit) {
val vertex = values(nextPositionToProcess)
if (vertex != null) {
p(vertex)
elementsProcessed += 1
keys(nextPositionToProcess) = 0
values(nextPositionToProcess) = null
numberOfElements -= 1
}
nextPositionToProcess = (nextPositionToProcess + 1) & mask
}
if (elementsProcessed > 0) {
optimizeFromPosition(nextPositionToProcess)
}
limit
}
// Removes the vertices after they have been processed.
def processWithCondition(p: Vertex[Long, _, Long, Any] => Unit, breakCondition: () => Boolean): Int = {
val limit = numberOfElements
var elementsProcessed = 0
while (elementsProcessed < limit && !breakCondition()) {
val vertex = values(nextPositionToProcess)
if (vertex != null) {
p(vertex)
elementsProcessed += 1
keys(nextPositionToProcess) = 0
values(nextPositionToProcess) = null
numberOfElements -= 1
}
nextPositionToProcess = (nextPositionToProcess + 1) & mask
}
if (elementsProcessed > 0) {
optimizeFromPosition(nextPositionToProcess)
}
elementsProcessed
}
private[this] def tryDouble(): Unit = {
// 1073741824 is the largest size and cannot be doubled anymore.
if (maxSize != 1073741824) {
val oldSize = maxSize
val oldValues = values
val oldKeys = keys
val oldNumberOfElements = numberOfElements
maxSize *= 2
maxElements = (rehashFraction * maxSize).floor.toInt
values = new Array[Vertex[Long, _, Long, Any]](maxSize)
keys = new Array[Long](maxSize)
mask = maxSize - 1
numberOfElements = 0
var i = 0
var elementsMoved = 0
while (elementsMoved < oldNumberOfElements) {
if (oldKeys(i) != 0) {
put(oldValues(i))
elementsMoved += 1
}
i += 1
}
}
}
def remove(vertexId: Long): Unit = {
remove(vertexId, true)
}
private[this] def remove(vertexId: Long, optimize: Boolean): Unit = {
var position = keyToPosition(vertexId)
var keyAtPosition = keys(position)
while (keyAtPosition != 0 && vertexId != keyAtPosition) {
position = (position + 1) & mask
keyAtPosition = keys(position)
}
// We can only remove the entry if it was found.
if (keyAtPosition != 0) {
keys(position) = 0
values(position) = null
numberOfElements -= 1
if (optimize) {
optimizeFromPosition((position + 1) & mask)
}
}
}
// Try to reinsert all elements that are not optimally placed until an empty position is found.
// See http://stackoverflow.com/questions/279539/best-way-to-remove-an-entry-from-a-hash-table
@inline private[this] def optimizeFromPosition(startingPosition: Int): Unit = {
var currentPosition = startingPosition
var keyAtPosition = keys(currentPosition)
while (isCurrentPositionOccupied) {
val perfectPositionForEntry = keyToPosition(keyAtPosition)
if (perfectPositionForEntry != currentPosition) {
// We try to optimize the placement of the entry by removing and then reinserting it.
val vertex = values(currentPosition)
removeCurrentEntry
putWithKey(keyAtPosition, vertex)
}
advance
}
@inline def advance(): Unit = {
currentPosition = ((currentPosition + 1) & mask)
keyAtPosition = keys(currentPosition)
}
@inline def isCurrentPositionOccupied: Boolean = {
keyAtPosition != 0
}
@inline def removeCurrentEntry(): Unit = {
keys(currentPosition) = 0
values(currentPosition) = null
numberOfElements -= 1
}
}
@inline def get(vertexId: Long): Vertex[Long, _, Long, Any] = {
var position = keyToPosition(vertexId)
var keyAtPosition = keys(position)
while (keyAtPosition != 0 && vertexId != keyAtPosition) {
position = (position + 1) & mask
keyAtPosition = keys(position)
}
if (keyAtPosition != 0) {
values(position)
} else {
null
}
}
// Only put if no vertex with the same id is present. If a vertex was put, return true.
def put(vertex: Vertex[Long, _, Long, Any]): Boolean = {
val success = putWithKey(vertex.id, vertex)
success
}
private[this] def putWithKey(key: Long, vertex: Vertex[Long, _, Long, Any]): Boolean = {
var position = keyToPosition(key)
var keyAtPosition = keys(position)
while (keyAtPosition != 0 && key != keyAtPosition) {
position = (position + 1) & mask
keyAtPosition = keys(position)
}
var doPut = keyAtPosition == 0
// Only put if the there is no vertex with the same id yet.
if (doPut) {
keys(position) = key
values(position) = vertex
numberOfElements += 1
if (numberOfElements >= maxElements) {
tryDouble
if (numberOfElements >= maxSize) {
throw new OutOfMemoryError("The hash map is full and cannot be expanded any further.")
}
}
}
doPut
}
@inline private[this] def keyToPosition(efficientIndexPattern: Long): Int = {
Hashing.hash(efficientIndexPattern.extractFirst, efficientIndexPattern.extractSecond) & mask
}
private[this] def nextPowerOfTwo(x: Int): Int = {
var r = x - 1
r |= r >> 1
r |= r >> 2
r |= r >> 4
r |= r >> 8
r |= r >> 16
r + 1
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy