All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.opentripplanner.framework.geometry.HashGridSpatialIndex Maven / Gradle / Ivy

The newest version!
package org.opentripplanner.framework.geometry;

import gnu.trove.map.hash.TLongObjectHashMap;
import gnu.trove.set.TLongSet;
import gnu.trove.set.hash.TLongHashSet;
import java.io.Serializable;
import java.util.ArrayList;
import java.util.HashSet;
import java.util.List;
import java.util.Locale;
import java.util.Set;
import org.locationtech.jts.geom.Coordinate;
import org.locationtech.jts.geom.Envelope;
import org.locationtech.jts.geom.LineString;
import org.locationtech.jts.index.ItemVisitor;
import org.locationtech.jts.index.SpatialIndex;
import org.opentripplanner.framework.lang.IntBox;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

/**
 * A spatial index using a 2D fast long hashtable (Trove lib).
 * 

* Objects to index are placed in all grid bins touching the bounding envelope. We *do not store* * any bouding envelope for each object, so this imply that we will return false positive when * querying, and it's up to the client to filter them out (with whatever knowledge it has on the * location of the object). *

* Note: For performance reasons, write operation are not synchronized, it must be taken care by the * client. Read-only operation are multi-thread-safe though. * * @param Type of objects to be spatial indexed. * @author laurent */ public class HashGridSpatialIndex implements SpatialIndex, Serializable { @SuppressWarnings("unused") private static final Logger LOG = LoggerFactory.getLogger(HashGridSpatialIndex.class); /* Computation done based on geographical coordinates. */ // private static final double DEFAULT_Y_BIN_SIZE = 0.010; // ~1km private static final double DEFAULT_Y_BIN_SIZE = 0.005; // ~500m /* Computation done based on geographical coordinates at ~45 degree lat */ // private static final double DEFAULT_X_BIN_SIZE = 0.007; // ~1km private static final double DEFAULT_X_BIN_SIZE = 0.0035; // ~500m /* Size of bin in X and Y direction, in coordinates units. */ private final double xBinSize, yBinSize; /* The map of all bins. Please see visit() and xKey/yKey for details on the key. */ private final TLongObjectHashMap> bins; private int nBins = 0; private int nObjects = 0; private int nEntries = 0; public HashGridSpatialIndex(double xBinSize, double yBinSize) { if (xBinSize <= 0 || yBinSize <= 0) throw new IllegalStateException( "bin size must be positive." ); this.xBinSize = xBinSize; this.yBinSize = yBinSize; // For 200m bins, 500x500 = 100x100km = 250000 bins bins = new TLongObjectHashMap<>(); } /** Create a HashGrid with the default grid dimensions. */ public HashGridSpatialIndex() { this(DEFAULT_X_BIN_SIZE, DEFAULT_Y_BIN_SIZE); } @Override public final void insert(Envelope envelope, final Object item) { visit( envelope, true, (bin, mapKey) -> { /* * Note: here we can end-up having several time the same object in the same bin, if * the client insert multiple times the same object with different envelopes. * However we do filter duplicated when querying, so apart for memory/performance * reasons it should work. If this becomes a problem, we can use a set instead of a * list. */ bin.add((T) item); nEntries++; return false; } ); nObjects++; } @Override public final List query(Envelope envelope) { final Set ret = new HashSet<>(1024); visit( envelope, false, (bin, mapKey) -> { ret.addAll(bin); return false; } ); return new ArrayList<>(ret); } @Override public final void query(Envelope envelope, ItemVisitor visitor) { // We are cheating a bit here... But who cares? Never called in OTP. List tlist = query(envelope); for (T t : tlist) { visitor.visitItem(t); } } @Override public final boolean remove(Envelope envelope, final Object item) { // This iterates over the entire rectangular envelope of the edge rather than the segments // making it up. It will be inefficient for very long edges, but creating a new remove method // mirroring the more efficient insert logic is not trivial and would require additional // testing of the spatial index. final IntBox removedCount = new IntBox(0); visit( envelope, false, (bin, mapKey) -> { boolean removed = bin.remove(item); if (removed) { nEntries--; removedCount.inc(); } return removed; } ); if (removedCount.get() > 0) { nObjects--; return true; } else { return false; } } public final void insert(LineString geom, final Object item) { Coordinate[] coord = geom.getCoordinates(); final TLongSet keys = new TLongHashSet(coord.length * 8); for (int i = 0; i < coord.length - 1; i++) { // TODO Cut the segment if longer than bin size // to reduce the number of wrong bins Envelope env = new Envelope(coord[i], coord[i + 1]); visit( env, true, (bin, mapKey) -> { keys.add(mapKey); return false; } ); } keys.forEach(key -> { // Note: bins have been initialized in the previous visit bins.get(key).add((T) item); nEntries++; return true; }); nObjects++; } /** * Make each bin be exactly the required size. This is helpful for large indices, which are mostly * used for reads only. */ public void compact() { bins.forEachValue(ts -> { ts.trimToSize(); return true; }); } public String toString() { return String.format( Locale.ROOT, "HashGridSpatialIndex %f x %f, %d bins allocated, %d objs, %d entries (avg %.2f entries/bin, %.2f entries/object)", this.xBinSize, this.yBinSize, this.nBins, this.nObjects, this.nEntries, this.nEntries * 1.0 / this.nBins, this.nEntries * 1.0 / this.nObjects ); } /** Clamp a coordinate to allowable lat/lon values */ private static Coordinate clamp(Coordinate coord) { if (Math.abs(coord.x) > 180 || Math.abs(coord.y) > 90) { LOG.warn( "Corner of envelope {} was invalid, clamping to valid range. Perhaps you're buffering something near a pole?", coord ); // make a defensive copy as we're about to modify the coordinate coord = new Coordinate(coord); if (coord.x > 180) { coord.x = 180; } if (coord.x < -180) { coord.x = -180; } if (coord.y > 90) { coord.y = 90; } if (coord.y < -90) { coord.y = -90; } } return coord; } /** * Visit each bin touching the envelope. * * @param envelope Self-descripting. * @param createIfEmpty Create a new bin if not existing. * @param binVisitor The callback to call for each visited bin. */ private void visit(Envelope envelope, boolean createIfEmpty, final BinVisitor binVisitor) { Coordinate min = new Coordinate(envelope.getMinX(), envelope.getMinY()); Coordinate max = new Coordinate(envelope.getMaxX(), envelope.getMaxY()); // clamp coordinates to earth. TODO: handle cross-date-line envelopes. min = clamp(min); max = clamp(max); long minXKey = Math.round(min.x / xBinSize); long maxXKey = Math.round(max.x / xBinSize); long minYKey = Math.round(min.y / yBinSize); long maxYKey = Math.round(max.y / yBinSize); for (long xKey = minXKey; xKey <= maxXKey; xKey++) { for (long yKey = minYKey; yKey <= maxYKey; yKey++) { /* * For all known use, the average absolute value of x/y keys will be rather small * compared to Integer.MAX_VALUE. We need to swap the two words (MSB and LSB) of * xKey in order to have a well-behaving long hash, fitting in an int, because the * default implementation is: hashInt = (int)(value ^ (value >>> 32)); */ long mapKey = (yKey << 32) | ((xKey & 0xFFFF) << 16) | ((xKey >> 16) & 0xFFFF); ArrayList bin = bins.get(mapKey); if (createIfEmpty && bin == null) { bin = new ArrayList<>(); bins.put(mapKey, bin); nBins++; } if (bin != null) { boolean modified = binVisitor.visit(bin, mapKey); if (modified && bin.isEmpty()) { bins.remove(mapKey); nBins--; } } } } } private interface BinVisitor { /** * Bin visitor callback. * * @return true if something has been removed from the bin. */ boolean visit(List bin, long mapKey); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy