All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.heigit.bigspatialdata.oshdb.api.mapreducer.GeometrySplitter Maven / Gradle / Ivy

Go to download

API to query the OpenStreetMap History Database. Includes MapReduce functionality to filter, analyze and aggregate data.

There is a newer version: 1.2.3
Show newest version
package org.heigit.bigspatialdata.oshdb.api.mapreducer;

import java.io.IOException;
import java.io.ObjectInputStream;
import java.io.ObjectOutputStream;
import java.io.ObjectStreamException;
import java.io.Serializable;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.TreeMap;
import java.util.stream.Collectors;
import java.util.stream.Stream;
import org.heigit.bigspatialdata.oshdb.api.object.OSMContribution;
import org.heigit.bigspatialdata.oshdb.api.object.OSMEntitySnapshot;
import org.heigit.bigspatialdata.oshdb.util.OSHDBBoundingBox;
import org.heigit.bigspatialdata.oshdb.util.celliterator.ContributionType;
import org.heigit.bigspatialdata.oshdb.util.celliterator.LazyEvaluatedObject;
import org.heigit.bigspatialdata.oshdb.util.geometry.OSHDBGeometryBuilder;
import org.heigit.bigspatialdata.oshdb.util.geometry.fip.FastBboxInPolygon;
import org.heigit.bigspatialdata.oshdb.util.geometry.fip.FastBboxOutsidePolygon;
import org.heigit.bigspatialdata.oshdb.util.geometry.fip.FastPolygonOperations;
import org.locationtech.jts.geom.Geometry;
import org.locationtech.jts.geom.GeometryFactory;
import org.locationtech.jts.geom.Polygonal;
import org.locationtech.jts.geom.TopologyException;
import org.locationtech.jts.geom.prep.PreparedGeometry;
import org.locationtech.jts.geom.prep.PreparedGeometryFactory;
import org.locationtech.jts.index.strtree.STRtree;
import org.locationtech.jts.io.ParseException;
import org.locationtech.jts.io.WKBReader;
import org.locationtech.jts.io.WKBWriter;

/**
 * Helper class to split "MapReducible" objects into sub-regions of an area of interest.
 *
 * @param  an arbitrary index type to identify supplied sub-regions
 */
class GeometrySplitter> implements Serializable {
  private static final long serialVersionUID = 1L;

  private STRtree spatialIndex = new STRtree();
  private Map bips = new HashMap<>();
  private Map bops = new HashMap<>();
  private Map poops = new HashMap<>();
  private Map pgs = new HashMap<>();

  private Map subregions;

  

GeometrySplitter(Map subregions) { PreparedGeometryFactory pgf = new PreparedGeometryFactory(); subregions.forEach((index, geometry) -> { spatialIndex.insert(geometry.getEnvelopeInternal(), index); bips.put(index, new FastBboxInPolygon(geometry)); bops.put(index, new FastBboxOutsidePolygon(geometry)); poops.put(index, new FastPolygonOperations(geometry)); pgs.put(index, pgf.create(geometry)); }); this.subregions = subregions; } private static class IndexData { private final I index; private final D data; IndexData(I index, D data) { this.index = index; this.data = data; } I getIndex() { return index; } D getData() { return data; } } /** * Splits osm entity snapshot objects into sub-regions. * * @param data the OSMEntitySnapshot to split into the given sub-regions * @return a list of OSMEntitySnapshot objects */ public Map splitOSMEntitySnapshot(OSMEntitySnapshot data) { OSHDBBoundingBox oshBoundingBox = data.getOSHEntity().getBoundingBox(); @SuppressWarnings("unchecked") // STRtree works with raw types unfortunately List candidates = (List) spatialIndex.query( OSHDBGeometryBuilder.getGeometry(oshBoundingBox).getEnvelopeInternal() ); return candidates.stream() // OSH entity fully outside -> skip .filter(index -> !bops.get(index).test(oshBoundingBox)) .flatMap(index -> { if (bips.get(index).test(oshBoundingBox)) { // OSH entity fully inside -> directly return return Stream.of(new IndexData<>(index, data)); } // now we can check against the actual contribution geometry Geometry snapshotGeometry = data.getGeometry(); OSHDBBoundingBox snapshotBbox = OSHDBGeometryBuilder.boundingBoxOf( snapshotGeometry.getEnvelopeInternal() ); // OSM entity fully outside -> skip if (bops.get(index).test(snapshotBbox)) { return Stream.empty(); } // OSM entity fully inside -> directly return if (bips.get(index).test(snapshotBbox)) { return Stream.of(new IndexData<>(index, data)); } FastPolygonOperations poop = poops.get(index); PreparedGeometry pg = pgs.get(index); try { boolean intersects = pg.intersects(snapshotGeometry); if (!intersects) { // not actually intersecting -> skip return Stream.empty(); } else { return Stream.of(new IndexData<>(index, new OSMEntitySnapshot(data, new LazyEvaluatedObject<>(() -> faultTolerantIntersection(snapshotGeometry, poop)) ))); } } catch (TopologyException ignored) { // JTS cannot handle broken osm geometry -> skip return Stream.empty(); } }).collect(Collectors.toMap(IndexData::getIndex, IndexData::getData)); } /** * Splits osm contributions into sub-regions. * *

* The original contribution type is preserved during this operation. * For example, when a building was moved inside the area of interest from sub-region A into sub- * region B, there will be two contribution objects in the result, both of type "geometry change" * (note that in this case the contribution object of sub-region A will … * todo: ^ is this the right behaviour of contribution types when splitting into sub-regions? *

* * @param data the OSMContribution to split into the given sub-regions * @return a list of OSMContribution objects */ public Map splitOSMContribution(OSMContribution data) { OSHDBBoundingBox oshBoundingBox = data.getOSHEntity().getBoundingBox(); @SuppressWarnings("unchecked") // STRtree works with raw types unfortunately List candidates = (List) spatialIndex.query( OSHDBGeometryBuilder.getGeometry(oshBoundingBox).getEnvelopeInternal() ); return candidates.stream() // OSH entity fully outside -> skip .filter(index -> !bops.get(index).test(oshBoundingBox)) .flatMap(index -> { // OSH entity fully inside -> directly return if (bips.get(index).test(oshBoundingBox)) { return Stream.of(new IndexData<>(index, data)); } // now we can check against the actual contribution geometry Geometry contributionGeometryBefore = data.getGeometryBefore(); Geometry contributionGeometryAfter = data.getGeometryAfter(); OSHDBBoundingBox contributionGeometryBbox; if (data.is(ContributionType.CREATION)) { contributionGeometryBbox = OSHDBGeometryBuilder.boundingBoxOf( contributionGeometryAfter.getEnvelopeInternal() ); } else if (data.is(ContributionType.DELETION)) { contributionGeometryBbox = OSHDBGeometryBuilder.boundingBoxOf( contributionGeometryBefore.getEnvelopeInternal() ); } else { contributionGeometryBbox = OSHDBGeometryBuilder.boundingBoxOf( contributionGeometryBefore.getEnvelopeInternal() ); contributionGeometryBbox.add(OSHDBGeometryBuilder.boundingBoxOf( contributionGeometryAfter.getEnvelopeInternal() )); } if (bops.get(index).test(contributionGeometryBbox)) { // contribution fully outside -> skip return Stream.empty(); } if (bips.get(index).test(contributionGeometryBbox)) { // contribution fully inside -> directly return return Stream.of(new IndexData<>(index, data)); } FastPolygonOperations poop = poops.get(index); PreparedGeometry pg = pgs.get(index); try { boolean intersectsBefore = contributionGeometryBefore != null && pg.intersects(contributionGeometryBefore); boolean intersectsAfter = contributionGeometryAfter != null && pg.intersects(contributionGeometryAfter); if ((!intersectsBefore) && (!intersectsAfter)) { // not actually intersecting -> skip return Stream.empty(); } else { return Stream.of(new IndexData<>(index, new OSMContribution(data, new LazyEvaluatedObject<>(() -> faultTolerantIntersection(contributionGeometryBefore, poop)), new LazyEvaluatedObject<>(() -> faultTolerantIntersection(contributionGeometryAfter, poop))) )); } } catch (TopologyException ignored) { // JTS cannot handle broken osm geometry -> skip return Stream.empty(); } }).collect(Collectors.toMap(IndexData::getIndex, IndexData::getData)); } private static Geometry faultTolerantIntersection(Geometry subject, FastPolygonOperations poop) { try { return poop.intersection(subject); } catch (TopologyException ignored) { // JTS cannot handle broken osm geometry -> return empty geometry return (new GeometryFactory()).createGeometryCollection(); } } /** * Custom object serialization/deserialization. * *

* Sometimes, a GeometrySplitter can end up containing quite many deeply nested child-objects. * Which can lead to relatively slow object serialization. It is then faster to just transfer * the geometries and re-create the indices at the destination after de-serializing. *

*/ private void writeObject(ObjectOutputStream out) throws IOException { WKBWriter writer = new WKBWriter(); out.writeInt(this.subregions.size()); for (Entry entry : this.subregions.entrySet()) { out.writeObject(entry.getKey()); byte[] data = writer.write(entry.getValue()); out.writeInt(data.length); out.write(data); } } private

void readObject(ObjectInputStream in) throws IOException, ClassNotFoundException { WKBReader reader = new WKBReader(); int numEntries = in.readInt(); TreeMap result = new TreeMap<>(); for (int i = 0; i < numEntries; i++) { @SuppressWarnings("unchecked") // we only write `U` data in these places in `writeObject` U key = (U) in.readObject(); int dataLength = in.readInt(); byte[] data = new byte[dataLength]; int bytesRead = in.read(data); assert bytesRead == dataLength : "fewer bytes read than expected"; try { @SuppressWarnings("unchecked") // we only write `P` data in these places in `writeObject` P readData = (P) reader.read(data); result.put(key, readData); } catch (ParseException e) { throw new RuntimeException(e); } } this.subregions = result; } protected

Object readResolve() throws ObjectStreamException { @SuppressWarnings("unchecked") // constructor checks that `subregions` only contain `P` entries Map subregions = (Map) this.subregions; return new GeometrySplitter<>(subregions); } }