// This software is released into the Public Domain. See copying.txt for details.
package com.graphhopper.osm.pbf;

import com.carrotsearch.hppc.LongIndexedContainer;
import com.google.protobuf.InvalidProtocolBufferException;
import com.graphhopper.reader.ReaderElement;
import com.graphhopper.reader.ReaderNode;
import com.graphhopper.reader.ReaderRelation;
import com.graphhopper.reader.ReaderWay;
import com.graphhopper.osm.OSMFileHeader;
import com.graphhopper.util.Helper;
import org.openstreetmap.osmosis.osmbinary.Fileformat;
import org.openstreetmap.osmosis.osmbinary.Osmformat;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import java.io.IOException;
import java.util.*;
import java.util.zip.DataFormatException;
import java.util.zip.Inflater;

/**
 * Converts PBF block data into decoded entities ready to be passed into an Osmosis pipeline. This
 * class is designed to be passed into a pool of worker threads to allow multi-threaded decoding.
 * <p>
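 * A minimal usage sketch (hypothetical wiring: {@code rawBlobBytes} and {@code listener} are
 * assumed to be supplied by the surrounding PBF reader, which owns the worker pool):
 * <pre>{@code
 * ExecutorService pool = Executors.newFixedThreadPool(2);
 * pool.execute(new PbfBlobDecoder("OSMData", rawBlobBytes, listener));
 * pool.shutdown();
 * }</pre>
 *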
 * @author Brett Henderson
 */
public class PbfBlobDecoder implements Runnable {
    private static final Logger log = LoggerFactory.getLogger(PbfBlobDecoder.class);
    private final boolean checkData = false;
    private final String blobType;
    private final byte[] rawBlob;
    private final PbfBlobDecoderListener listener;
    private List<ReaderElement> decodedEntities;

    /**
     * Creates a new instance.
     *
     * @param blobType The type of blob.
     * @param rawBlob  The raw data of the blob.
     * @param listener The listener for receiving decoding results.
     */
    public PbfBlobDecoder(String blobType, byte[] rawBlob, PbfBlobDecoderListener listener) {
        this.blobType = blobType;
        this.rawBlob = rawBlob;
        this.listener = listener;
    }

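    // Extracts the payload of a Fileformat.Blob. Per the OSM PBF format, a Blob carries either
    // uncompressed `raw` bytes or `zlib_data` together with `raw_size`, the payload size after
    // decompression.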
    private byte[] readBlobContent() throws IOException {
        Fileformat.Blob blob = Fileformat.Blob.parseFrom(rawBlob);
        byte[] blobData;

        if (blob.hasRaw()) {
            blobData = blob.getRaw().toByteArray();
        } else if (blob.hasZlibData()) {
            Inflater inflater = new Inflater();
            inflater.setInput(blob.getZlibData().toByteArray());
            blobData = new byte[blob.getRawSize()];
            try {
                inflater.inflate(blobData);
            } catch (DataFormatException e) {
                throw new RuntimeException("Unable to decompress PBF blob.", e);
            }
            if (!inflater.finished()) {
                throw new RuntimeException("PBF blob contains incomplete compressed data.");
            }
        } else {
            throw new RuntimeException("PBF blob uses unsupported compression, only raw or zlib may be used.");
        }
        return blobData;
    }

    private void processOsmHeader(byte[] data) throws InvalidProtocolBufferException {
        Osmformat.HeaderBlock header = Osmformat.HeaderBlock.parseFrom(data);

        // Build the list of active and unsupported features in the file.
        List<String> supportedFeatures = Arrays.asList("OsmSchema-V0.6", "DenseNodes");
        List<String> unsupportedFeatures = new ArrayList<>();
        for (String feature : header.getRequiredFeaturesList()) {
            if (!supportedFeatures.contains(feature)) {
                unsupportedFeatures.add(feature);
            }
        }

        // We can't continue if there are any unsupported features. We wait
        // until now so that we can display all unsupported features instead of
        // just the first one we encounter.
        if (!unsupportedFeatures.isEmpty()) {
            throw new RuntimeException("PBF file contains unsupported features " + unsupportedFeatures);
        }

        OSMFileHeader fileheader = new OSMFileHeader();
        // The replication timestamp is stored in seconds since the epoch.
        long replicationSeconds = header.getOsmosisReplicationTimestamp();
        fileheader.setTag("timestamp", Helper.createFormatter().format(new Date(replicationSeconds * 1000)));
        decodedEntities.add(fileheader);

        // Build a new bound object which corresponds to the header.
        /*
        Bound bound;
        if (header.hasBbox()) {
            HeaderBBox bbox = header.getBbox();
            bound = new Bound(bbox.getRight() * COORDINATE_SCALING_FACTOR, bbox.getLeft() * COORDINATE_SCALING_FACTOR,
                    bbox.getTop() * COORDINATE_SCALING_FACTOR, bbox.getBottom() * COORDINATE_SCALING_FACTOR,
                    header.getSource());
        } else {
            bound = new Bound(header.getSource());
        }

        // Add the bound object to the results.
        decodedEntities.add(new BoundContainer(bound));
        */
    }

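    // Builds a tag map from two parallel lists of string-table indexes. Worked example
    // (hypothetical indexes): keys = [1, 3] and values = [2, 4] become {s(1)=s(2), s(3)=s(4)},
    // where s(i) is fieldDecoder.decodeString(i). Returns null when there are no tags.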
    private Map<String, String> buildTags(List<Integer> keys, List<Integer> values, PbfFieldDecoder fieldDecoder) {
        // Ensure parallel lists are of equal size.
        if (checkData) {
            if (keys.size() != values.size()) {
                throw new RuntimeException("Number of tag keys (" + keys.size() + ") and tag values ("
                        + values.size() + ") don't match");
            }
        }

        Iterator<Integer> keyIterator = keys.iterator();
        Iterator<Integer> valueIterator = values.iterator();
        if (keyIterator.hasNext()) {
            Map<String, String> tags = new HashMap<>(keys.size());
            while (keyIterator.hasNext()) {
                String key = fieldDecoder.decodeString(keyIterator.next());
                String value = fieldDecoder.decodeString(valueIterator.next());
                tags.put(key, value);
            }
            return tags;
        }
        return null;
    }

    private void processNodes(List<Osmformat.Node> nodes, PbfFieldDecoder fieldDecoder) {
        for (Osmformat.Node node : nodes) {
            Map<String, String> tags = buildTags(node.getKeysList(), node.getValsList(), fieldDecoder);
            ReaderNode osmNode = new ReaderNode(node.getId(), fieldDecoder.decodeLatitude(node.getLat()),
                    fieldDecoder.decodeLongitude(node.getLon()));
            osmNode.setTags(tags);

            // Add the node to the results.
            decodedEntities.add(osmNode);
        }
    }

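    // DenseNodes store all node ids, latitudes and longitudes of a group in three parallel,
    // delta-encoded arrays, with the tags of all nodes interleaved into a single keys_vals array.
    // Worked example (made-up values): id = [100, 1, 1] decodes to node ids [100, 101, 102];
    // lat and lon are decoded the same way.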
    private void processNodes(Osmformat.DenseNodes nodes, PbfFieldDecoder fieldDecoder) {
        List<Long> idList = nodes.getIdList();
        List<Long> latList = nodes.getLatList();
        List<Long> lonList = nodes.getLonList();

        // Ensure parallel lists are of equal size.
        if (checkData) {
            if ((idList.size() != latList.size()) || (idList.size() != lonList.size())) {
                throw new RuntimeException("Number of ids (" + idList.size() + "), latitudes (" + latList.size()
                        + "), and longitudes (" + lonList.size() + ") don't match");
            }
        }

        Iterator<Integer> keysValuesIterator = nodes.getKeysValsList().iterator();

        /*
        Osmformat.DenseInfo denseInfo;
        if (nodes.hasDenseinfo()) {
            denseInfo = nodes.getDenseinfo();
        } else {
            denseInfo = null;
        }
        */

        long nodeId = 0;
        long latitude = 0;
        long longitude = 0;
        // int userId = 0;
        // int userSid = 0;
        // long timestamp = 0;
        // long changesetId = 0;

        for (int i = 0; i < idList.size(); i++) {
            // Delta decode node fields.
            nodeId += idList.get(i);
            latitude += latList.get(i);
            longitude += lonList.get(i);

            /*
            if (denseInfo != null) {
                // Delta decode dense info fields.
                userId += denseInfo.getUid(i);
                userSid += denseInfo.getUserSid(i);
                timestamp += denseInfo.getTimestamp(i);
                changesetId += denseInfo.getChangeset(i);

                // Build the user, but only if one exists.
                OsmUser user;
                if (userId >= 0) {
                    user = new OsmUser(userId, fieldDecoder.decodeString(userSid));
                } else {
                    user = OsmUser.NONE;
                }

                entityData = new CommonEntityData(nodeId, denseInfo.getVersion(i),
                        fieldDecoder.decodeTimestamp(timestamp), user, changesetId);
            } else {
                entityData = new CommonEntityData(nodeId, EMPTY_VERSION, EMPTY_TIMESTAMP, OsmUser.NONE,
                        EMPTY_CHANGESET);
            }
            */
            // Build the tags. The key and value string indexes are sequential
            // in the same PBF array. Each set of tags is delimited by an index
            // with a value of 0.
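            // Worked example (hypothetical indexes): keys_vals = [1, 2, 3, 4, 0, 5, 6, 0]
            // yields one node with tags {s(1)=s(2), s(3)=s(4)} and the next node with
            // {s(5)=s(6)}, where s(i) is fieldDecoder.decodeString(i).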
            Map<String, String> tags = null;
            while (keysValuesIterator.hasNext()) {
                int keyIndex = keysValuesIterator.next();
                if (keyIndex == 0) {
                    break;
                }
                if (checkData) {
                    if (!keysValuesIterator.hasNext()) {
                        throw new RuntimeException(
                                "The PBF DenseInfo keys/values list contains a key with no corresponding value.");
                    }
                }

                int valueIndex = keysValuesIterator.next();
                if (tags == null) {
                    // Divide by 2 because the list holds key/value pairs, giving the average number
                    // of tags per node; multiply by 2 to give the HashMap room before it resizes.
                    tags = new HashMap<>(Math.max(3, 2 * (nodes.getKeysValsList().size() / 2) / idList.size()));
                }
                tags.put(fieldDecoder.decodeString(keyIndex), fieldDecoder.decodeString(valueIndex));
            }

            // Decode via the field decoder so the granularity and offset from the block header are honoured.
            ReaderNode node = new ReaderNode(nodeId, fieldDecoder.decodeLatitude(latitude),
                    fieldDecoder.decodeLongitude(longitude));
            node.setTags(tags);

            // Add the node to the results.
            decodedEntities.add(node);
        }
    }

    private void processWays(List<Osmformat.Way> ways, PbfFieldDecoder fieldDecoder) {
        for (Osmformat.Way way : ways) {
            Map<String, String> tags = buildTags(way.getKeysList(), way.getValsList(), fieldDecoder);
            ReaderWay osmWay = new ReaderWay(way.getId());
            osmWay.setTags(tags);

            // Build up the list of way nodes for the way. The node ids are
            // delta encoded, meaning that each id is stored as a delta against
            // the previous one.
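            // Worked example (made-up ids): refs = [1000, 2, -1] decodes to
            // node ids [1000, 1002, 1001].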
            long nodeId = 0;
            LongIndexedContainer wayNodes = osmWay.getNodes();
            for (long nodeIdOffset : way.getRefsList()) {
                nodeId += nodeIdOffset;
                wayNodes.add(nodeId);
            }

            decodedEntities.add(osmWay);
        }
    }

    private void buildRelationMembers(ReaderRelation relation,
            List<Long> memberIds, List<Integer> memberRoles, List<Osmformat.Relation.MemberType> memberTypes,
            PbfFieldDecoder fieldDecoder) {
        // Ensure parallel lists are of equal size.
        if (checkData) {
            if ((memberIds.size() != memberRoles.size()) || (memberIds.size() != memberTypes.size())) {
                throw new RuntimeException("Number of member ids (" + memberIds.size() + "), member roles ("
                        + memberRoles.size() + "), and member types (" + memberTypes.size() + ") don't match");
            }
        }

        Iterator<Long> memberIdIterator = memberIds.iterator();
        Iterator<Integer> memberRoleIterator = memberRoles.iterator();
        Iterator<Osmformat.Relation.MemberType> memberTypeIterator = memberTypes.iterator();

        // Build up the list of relation members for the relation. The member ids are
        // delta encoded, meaning that each id is stored as a delta against
        // the previous one.
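        // Worked example (made-up values): memids = [5, 1] with types = [WAY, NODE] and
        // roles_sid = [3, 4] decodes to members (WAY, id 5, role s(3)) and (NODE, id 6, role s(4)).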
        long refId = 0;
        while (memberIdIterator.hasNext()) {
            Osmformat.Relation.MemberType memberType = memberTypeIterator.next();
            refId += memberIdIterator.next();

            int entityType = ReaderRelation.Member.NODE;
            if (memberType == Osmformat.Relation.MemberType.WAY) {
                entityType = ReaderRelation.Member.WAY;
            } else if (memberType == Osmformat.Relation.MemberType.RELATION) {
                entityType = ReaderRelation.Member.RELATION;
            }
            if (checkData) {
                if (entityType == ReaderRelation.Member.NODE && memberType != Osmformat.Relation.MemberType.NODE) {
                    throw new RuntimeException("Member type of " + memberType + " is not supported.");
                }
            }

            ReaderRelation.Member member = new ReaderRelation.Member(entityType, refId,
                    fieldDecoder.decodeString(memberRoleIterator.next()));
            relation.add(member);
        }
    }

    private void processRelations(List<Osmformat.Relation> relations, PbfFieldDecoder fieldDecoder) {
        for (Osmformat.Relation relation : relations) {
            Map<String, String> tags = buildTags(relation.getKeysList(), relation.getValsList(), fieldDecoder);
            ReaderRelation osmRelation = new ReaderRelation(relation.getId());
            osmRelation.setTags(tags);

            buildRelationMembers(osmRelation, relation.getMemidsList(), relation.getRolesSidList(),
                    relation.getTypesList(), fieldDecoder);

            // Add the relation to the results.
            decodedEntities.add(osmRelation);
        }
    }

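    // A PrimitiveBlock bundles a string table (plus granularity and offsets) with one or more
    // PrimitiveGroups; per the PBF format each group holds a single entity type, so at most one
    // of the process* calls below finds anything to do per group.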
    private void processOsmPrimitives(byte[] data) throws InvalidProtocolBufferException {
        Osmformat.PrimitiveBlock block = Osmformat.PrimitiveBlock.parseFrom(data);
        PbfFieldDecoder fieldDecoder = new PbfFieldDecoder(block);

        for (Osmformat.PrimitiveGroup primitiveGroup : block.getPrimitivegroupList()) {
            processNodes(primitiveGroup.getDense(), fieldDecoder);
            processNodes(primitiveGroup.getNodesList(), fieldDecoder);
            processWays(primitiveGroup.getWaysList(), fieldDecoder);
            processRelations(primitiveGroup.getRelationsList(), fieldDecoder);
        }
    }

    private void runAndTrapExceptions() {
        try {
            decodedEntities = new ArrayList<>();
            if ("OSMHeader".equals(blobType)) {
                processOsmHeader(readBlobContent());
            } else if ("OSMData".equals(blobType)) {
                processOsmPrimitives(readBlobContent());
            } else if (log.isDebugEnabled()) {
                log.debug("Skipping unrecognised blob type " + blobType);
            }
        } catch (IOException e) {
            throw new RuntimeException("Unable to process PBF blob", e);
        }
    }

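    // Decodes on the worker thread: on success the decoded entities are handed to
    // listener.complete(), on failure the RuntimeException is passed to listener.error().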
    @Override
    public void run() {
        try {
            runAndTrapExceptions();
            listener.complete(decodedEntities);
        } catch (RuntimeException e) {
            listener.error(e);
        }
    }
}