org.geolatte.geom.codec.WktTokenizer Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of geolatte-geom Show documentation
Show all versions of geolatte-geom Show documentation
This geoLatte-geom library offers a geometry model that conforms to the OGC Simple Features for SQL
specification.
/*
* This file is part of the GeoLatte project.
*
* GeoLatte is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* GeoLatte is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with GeoLatte. If not, see .
*
* Copyright (C) 2010 - 2011 and Ownership of code is shared by:
* Qmino bvba - Romeinsestraat 18 - 3001 Heverlee (http://www.qmino.com)
* Geovise bvba - Generaal Eisenhowerlei 9 - 2140 Antwerpen (http://www.geovise.com)
*/
package org.geolatte.geom.codec;
import org.geolatte.geom.PositionSequenceBuilder;
import org.geolatte.geom.PositionSequenceBuilders;
import org.geolatte.geom.crs.CoordinateReferenceSystem;
import org.geolatte.geom.crs.CoordinateReferenceSystems;
import org.geolatte.geom.crs.CrsRegistry;
import org.geolatte.geom.crs.Unit;
import static org.geolatte.geom.crs.CoordinateReferenceSystems.*;
/**
* A tokenizer for WKT representations.
*
* The variant of WKT that this tokenizer recognizes is determined by the {@link WktVariant}
* that is passed upon construction.
*
* @author Karel Maesen, Geovise BVBA, 2011
*/
class WktTokenizer extends AbstractWktTokenizer {
private boolean isMeasured = false;
protected final CoordinateReferenceSystem> baseCRS;
protected final boolean forceToCRS;
private CoordinateReferenceSystem> targetCRS;
/**
* A Tokenizer for the specified WKT string
*
* @param wkt the string to tokenize
* @param variant the list of words to recognize as separate variant
* @param baseCRS the CoordinateReferenceSystem
for the points in the WKT representation.
*/
protected WktTokenizer(CharSequence wkt, WktVariant variant, CoordinateReferenceSystem> baseCRS, boolean forceToCRS) {
super(wkt, variant);
if (wkt == null || variant == null)
throw new IllegalArgumentException("Input WKT and variant must not be null");
if (baseCRS == null) {
this.baseCRS = CoordinateReferenceSystems.PROJECTED_2D_METER;
this.forceToCRS = false;
} else {
this.baseCRS = baseCRS;
this.forceToCRS = forceToCRS;
}
}
protected WktTokenizer(CharSequence wkt, WktVariant variant, CoordinateReferenceSystem> baseCRS) {
this(wkt, variant, baseCRS, false);
}
@Override
WktToken numericToken() {
CoordinateReferenceSystem> crs = getCoordinateReferenceSystem();
int numPoints = countPoints();
//Note that the coords array can be larger than the number of coordinates available in the pointsequence
// e.g. when a composite CRS is passed in the decode function for a 2D WKT.
// this works because fastReadNumber returns 0 when attempting to read beyond a point delimiter
double[] coords = new double[crs.getCoordinateDimension()];
PositionSequenceBuilder> psBuilder = PositionSequenceBuilders.fixedSized(numPoints, crs.getPositionClass());
for (int i = 0; i < numPoints; i++) {
readPoint(coords);
psBuilder.add(coords);
skipPointDelimiter();
}
return new WktPointSequenceToken(psBuilder.toPositionSequence(), getCoordinateReferenceSystem());
}
private void readPoint(double[] coords) {
for (int i = 0; i < coords.length; i++) {
coords[i] = fastReadNumber();
}
}
/**
* Reads a number at the current position.
* Note that this method loses precision, e.g. 51.16666723333333 becomes 51.16666723333332)
*
* @return
*/
protected double fastReadNumber() {
skipWhitespace();
int startPos = currentPos;
char c = wkt.charAt(currentPos);
double sign = 1.0d;
//read the sign
if (c == '-') {
sign = -1.0d;
c = wkt.charAt(++currentPos);
}
//read the number and put it in form E
long s = 0l;
boolean decPntSeen = false;
long decPos = -1;
while (true) {
if (Character.isDigit(c)) {
s = 10 * s + (c - '0');
} else if (c == '.' ) {
if (decPntSeen) {
throw new WktDecodeException("Invalid number format at position " + currentPos);
}
decPntSeen = true;
} else {
break;
}
if (decPntSeen) {
decPos++;
}
c = wkt.charAt(++currentPos);
}
//read the exponent (scientific notation)
long exp = 0l;
long expSign = 1l;
if (c == 'e' || c == 'E') {
c = wkt.charAt(++currentPos);
if (c == '-') {
expSign = -1l;
c = wkt.charAt(++currentPos);
}
while (Character.isDigit(c)) {
exp = 10 * exp + (c - '0');
c = wkt.charAt(++currentPos);
}
}
long p = decPos >= 0 ? expSign * exp - decPos : expSign * exp;
int endPos = currentPos;
return toDouble(sign, s, p, startPos, endPos);
}
private int countPoints() {
int pos = currentPos + 1;
char c = wkt.charAt(pos);
int num = 1;
while (c != ')') {
if (c == ',') num++;
c = wkt.charAt(++pos);
}
return num;
}
private CoordinateReferenceSystem> getCoordinateReferenceSystem() {
if (targetCRS == null) {
targetCRS = determineTargetCRS();
}
return targetCRS;
}
private CoordinateReferenceSystem> determineTargetCRS() {
int pos = currentPos;
int num = 1;
boolean inNumber = true;
//move to the end of this point (ends with a ',' or a ')'
char c = wkt.charAt(pos);
while (!(c == ',' || c == variant.getCloseListChar())) {
if (!(Character.isDigit(c) || c == '.' || c == '-' || c == 'e' || c == 'E')) {
inNumber = false;
} else if (!inNumber) {
num++;
inNumber = true;
}
if (pos == wkt.length() - 1) throw new WktDecodeException("");
c = wkt.charAt(++pos);
}
if (num == 4) return ensureZM(baseCRS, true, true);
if (num == 3 && isMeasured) return ensureZM(baseCRS, false, true);
if (num == 3 && !isMeasured) return ensureZM(baseCRS, true, false);
if (num == 2) return baseCRS;
throw new WktDecodeException("Point with less than 2 coordinates at position " + currentPos);
}
private CoordinateReferenceSystem> ensureZM(CoordinateReferenceSystem> crs, boolean needZ, boolean needM) {
CoordinateReferenceSystem> compound = crs;
if (needZ && ! hasVerticalAxis(compound)) {
compound = addVerticalSystem(compound, Unit.METER);
}
if (needM && ! hasMeasureAxis(compound)) {
compound = addLinearSystem(compound, Unit.METER);
}
if (forceToCRS && !compound.equals(crs)) {
throw new WktDecodeException("WKT inconsistent with specified Coordinate Reference System");
}
return compound;
}
private void skipPointDelimiter() {
skipWhitespace();
if (wkt.charAt(currentPos) == ',') currentPos++;
}
protected WktToken matchKeyword(int currentPos, int endPos) {
WktToken token = variant.matchKeyword(wkt, currentPos, endPos);
if (token instanceof WktGeometryToken) {
this.isMeasured = isMeasured || ((WktGeometryToken) token).isMeasured();
}
return token;
}
/**
* Converts the decimal number representation into a double
*
* This routine tries to apply the "Fast path" to get a really fast conversion, if applicable. If not, it
* delegates to the more expensive Double.parseDouble() StdLib conversion.
*
* See: http://www.exploringbinary.com/fast-path-decimal-to-floating-point-conversion/
* and Handbook of Floating-Point Arithmetic, p. 47-8 (Muller e.a)
*
* @param sign the sign of the number
* @param s the decimal mantissa or significand as a long
* @param p the exponent as a long
* @param startPos the start position in the Wkt for the parsed number
* @param endPos the end position in the wkt for the parsed number
* @return
*/
protected double toDouble(double sign, long s, long p, int startPos, int endPos) {
//check if the Fast-path is applicable.
// we also test for negative s values to account for overrun/underrun conditions in the calling fastNumber procedure
if (s == 0) {
return 0.0d;
} else if (s > 0 && s <= S_MAX && Math.abs(p) <= P_MAX) {
if (p == 0l) {
return sign * s;
} else if (p < 0) {
return sign * (s / Math.pow(10,-p));
} else {
return sign * (s * Math.pow(10,p));
}
} else {
return Double.parseDouble(wkt.subSequence(startPos, endPos).toString());
}
}
private static long S_MAX = 9007199254740991L;
private static long P_MAX = 22l;
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy