org.heigit.bigspatialdata.oshdb.api.mapreducer.GeometrySplitter Maven / Gradle / Ivy
Show all versions of oshdb-api Show documentation
package org.heigit.bigspatialdata.oshdb.api.mapreducer;
import java.io.IOException;
import java.io.ObjectInputStream;
import java.io.ObjectOutputStream;
import java.io.ObjectStreamException;
import java.io.Serializable;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.TreeMap;
import java.util.stream.Collectors;
import java.util.stream.Stream;
import org.heigit.bigspatialdata.oshdb.api.object.OSMContribution;
import org.heigit.bigspatialdata.oshdb.api.object.OSMEntitySnapshot;
import org.heigit.bigspatialdata.oshdb.util.OSHDBBoundingBox;
import org.heigit.bigspatialdata.oshdb.util.celliterator.ContributionType;
import org.heigit.bigspatialdata.oshdb.util.celliterator.LazyEvaluatedObject;
import org.heigit.bigspatialdata.oshdb.util.geometry.OSHDBGeometryBuilder;
import org.heigit.bigspatialdata.oshdb.util.geometry.fip.FastBboxInPolygon;
import org.heigit.bigspatialdata.oshdb.util.geometry.fip.FastBboxOutsidePolygon;
import org.heigit.bigspatialdata.oshdb.util.geometry.fip.FastPolygonOperations;
import org.locationtech.jts.geom.Geometry;
import org.locationtech.jts.geom.GeometryFactory;
import org.locationtech.jts.geom.Polygonal;
import org.locationtech.jts.geom.TopologyException;
import org.locationtech.jts.geom.prep.PreparedGeometry;
import org.locationtech.jts.geom.prep.PreparedGeometryFactory;
import org.locationtech.jts.index.strtree.STRtree;
import org.locationtech.jts.io.ParseException;
import org.locationtech.jts.io.WKBReader;
import org.locationtech.jts.io.WKBWriter;
/**
* Helper class to split "MapReducible" objects into sub-regions of an area of interest.
*
* @param an arbitrary index type to identify supplied sub-regions
*/
class GeometrySplitter> implements Serializable {
private static final long serialVersionUID = 1L;
private STRtree spatialIndex = new STRtree();
private Map bips = new HashMap<>();
private Map bops = new HashMap<>();
private Map poops = new HashMap<>();
private Map pgs = new HashMap<>();
private Map subregions;
GeometrySplitter(Map subregions) {
PreparedGeometryFactory pgf = new PreparedGeometryFactory();
subregions.forEach((index, geometry) -> {
spatialIndex.insert(geometry.getEnvelopeInternal(), index);
bips.put(index, new FastBboxInPolygon(geometry));
bops.put(index, new FastBboxOutsidePolygon(geometry));
poops.put(index, new FastPolygonOperations(geometry));
pgs.put(index, pgf.create(geometry));
});
this.subregions = subregions;
}
private static class IndexData {
private final I index;
private final D data;
IndexData(I index, D data) {
this.index = index;
this.data = data;
}
I getIndex() {
return index;
}
D getData() {
return data;
}
}
/**
* Splits osm entity snapshot objects into sub-regions.
*
* @param data the OSMEntitySnapshot to split into the given sub-regions
* @return a list of OSMEntitySnapshot objects
*/
public Map splitOSMEntitySnapshot(OSMEntitySnapshot data) {
OSHDBBoundingBox oshBoundingBox = data.getOSHEntity().getBoundingBox();
@SuppressWarnings("unchecked") // STRtree works with raw types unfortunately
List candidates = (List) spatialIndex.query(
OSHDBGeometryBuilder.getGeometry(oshBoundingBox).getEnvelopeInternal()
);
return candidates.stream()
// OSH entity fully outside -> skip
.filter(index -> !bops.get(index).test(oshBoundingBox))
.flatMap(index -> {
if (bips.get(index).test(oshBoundingBox)) {
// OSH entity fully inside -> directly return
return Stream.of(new IndexData<>(index, data));
}
// now we can check against the actual contribution geometry
Geometry snapshotGeometry = data.getGeometry();
OSHDBBoundingBox snapshotBbox = OSHDBGeometryBuilder.boundingBoxOf(
snapshotGeometry.getEnvelopeInternal()
);
// OSM entity fully outside -> skip
if (bops.get(index).test(snapshotBbox)) {
return Stream.empty();
}
// OSM entity fully inside -> directly return
if (bips.get(index).test(snapshotBbox)) {
return Stream.of(new IndexData<>(index, data));
}
FastPolygonOperations poop = poops.get(index);
PreparedGeometry pg = pgs.get(index);
try {
boolean intersects = pg.intersects(snapshotGeometry);
if (!intersects) {
// not actually intersecting -> skip
return Stream.empty();
} else {
return Stream.of(new IndexData<>(index, new OSMEntitySnapshot(data,
new LazyEvaluatedObject<>(() ->
faultTolerantIntersection(snapshotGeometry, poop))
)));
}
} catch (TopologyException ignored) {
// JTS cannot handle broken osm geometry -> skip
return Stream.empty();
}
}).collect(Collectors.toMap(IndexData::getIndex, IndexData::getData));
}
/**
* Splits osm contributions into sub-regions.
*
*
* The original contribution type is preserved during this operation.
* For example, when a building was moved inside the area of interest from sub-region A into sub-
* region B, there will be two contribution objects in the result, both of type "geometry change"
* (note that in this case the contribution object of sub-region A will …
* todo: ^ is this the right behaviour of contribution types when splitting into sub-regions?
*
*
* @param data the OSMContribution to split into the given sub-regions
* @return a list of OSMContribution objects
*/
public Map splitOSMContribution(OSMContribution data) {
OSHDBBoundingBox oshBoundingBox = data.getOSHEntity().getBoundingBox();
@SuppressWarnings("unchecked") // STRtree works with raw types unfortunately
List candidates = (List) spatialIndex.query(
OSHDBGeometryBuilder.getGeometry(oshBoundingBox).getEnvelopeInternal()
);
return candidates.stream()
// OSH entity fully outside -> skip
.filter(index -> !bops.get(index).test(oshBoundingBox))
.flatMap(index -> {
// OSH entity fully inside -> directly return
if (bips.get(index).test(oshBoundingBox)) {
return Stream.of(new IndexData<>(index, data));
}
// now we can check against the actual contribution geometry
Geometry contributionGeometryBefore = data.getGeometryBefore();
Geometry contributionGeometryAfter = data.getGeometryAfter();
OSHDBBoundingBox contributionGeometryBbox;
if (data.is(ContributionType.CREATION)) {
contributionGeometryBbox = OSHDBGeometryBuilder.boundingBoxOf(
contributionGeometryAfter.getEnvelopeInternal()
);
} else if (data.is(ContributionType.DELETION)) {
contributionGeometryBbox = OSHDBGeometryBuilder.boundingBoxOf(
contributionGeometryBefore.getEnvelopeInternal()
);
} else {
contributionGeometryBbox = OSHDBGeometryBuilder.boundingBoxOf(
contributionGeometryBefore.getEnvelopeInternal()
);
contributionGeometryBbox.add(OSHDBGeometryBuilder.boundingBoxOf(
contributionGeometryAfter.getEnvelopeInternal()
));
}
if (bops.get(index).test(contributionGeometryBbox)) {
// contribution fully outside -> skip
return Stream.empty();
}
if (bips.get(index).test(contributionGeometryBbox)) {
// contribution fully inside -> directly return
return Stream.of(new IndexData<>(index, data));
}
FastPolygonOperations poop = poops.get(index);
PreparedGeometry pg = pgs.get(index);
try {
boolean intersectsBefore = contributionGeometryBefore != null
&& pg.intersects(contributionGeometryBefore);
boolean intersectsAfter = contributionGeometryAfter != null
&& pg.intersects(contributionGeometryAfter);
if ((!intersectsBefore) && (!intersectsAfter)) {
// not actually intersecting -> skip
return Stream.empty();
} else {
return Stream.of(new IndexData<>(index, new OSMContribution(data,
new LazyEvaluatedObject<>(() ->
faultTolerantIntersection(contributionGeometryBefore, poop)),
new LazyEvaluatedObject<>(() ->
faultTolerantIntersection(contributionGeometryAfter, poop)))
));
}
} catch (TopologyException ignored) {
// JTS cannot handle broken osm geometry -> skip
return Stream.empty();
}
}).collect(Collectors.toMap(IndexData::getIndex, IndexData::getData));
}
private static Geometry faultTolerantIntersection(Geometry subject, FastPolygonOperations poop) {
try {
return poop.intersection(subject);
} catch (TopologyException ignored) {
// JTS cannot handle broken osm geometry -> return empty geometry
return (new GeometryFactory()).createGeometryCollection();
}
}
/**
* Custom object serialization/deserialization.
*
*
* Sometimes, a GeometrySplitter can end up containing quite many deeply nested child-objects.
* Which can lead to relatively slow object serialization. It is then faster to just transfer
* the geometries and re-create the indices at the destination after de-serializing.
*
*/
private void writeObject(ObjectOutputStream out) throws IOException {
WKBWriter writer = new WKBWriter();
out.writeInt(this.subregions.size());
for (Entry entry : this.subregions.entrySet()) {
out.writeObject(entry.getKey());
byte[] data = writer.write(entry.getValue());
out.writeInt(data.length);
out.write(data);
}
}
private void readObject(ObjectInputStream in)
throws IOException, ClassNotFoundException {
WKBReader reader = new WKBReader();
int numEntries = in.readInt();
TreeMap result = new TreeMap<>();
for (int i = 0; i < numEntries; i++) {
@SuppressWarnings("unchecked") // we only write `U` data in these places in `writeObject`
U key = (U) in.readObject();
int dataLength = in.readInt();
byte[] data = new byte[dataLength];
int bytesRead = in.read(data);
assert bytesRead == dataLength : "fewer bytes read than expected";
try {
@SuppressWarnings("unchecked") // we only write `P` data in these places in `writeObject`
P readData = (P) reader.read(data);
result.put(key, readData);
} catch (ParseException e) {
throw new RuntimeException(e);
}
}
this.subregions = result;
}
protected
Object readResolve() throws ObjectStreamException {
@SuppressWarnings("unchecked") // constructor checks that `subregions` only contain `P` entries
Map subregions = (Map) this.subregions;
return new GeometrySplitter<>(subregions);
}
}