src.main.java.com.dd.plist.BinaryPropertyListParser Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of dd-plist Show documentation
Show all versions of dd-plist Show documentation
This library enables Java applications to work with property lists in various formats.
Supported formats for reading and writing are OS X/iOS binary and XML property lists.
ASCII property lists are also supported.
The library also provides access to basic functions of NeXTSTEP/Cocoa classes like
NSDictionary, NSArray, etc.
/*
* plist - An open source library to parse and generate property lists
* Copyright (C) 2011-2014 Daniel Dreibrodt
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*/
package com.dd.plist;
import java.io.*;
import java.math.BigInteger;
/**
* Parses property lists that are in Apple's binary format.
* Use this class when you are sure about the format of the property list.
* Otherwise use the PropertyListParser class.
*
* Parsing is done by calling the static parse
methods.
*
* @author Daniel Dreibrodt
*/
public final class BinaryPropertyListParser {
/**
* Major version of the property list format
*/
@SuppressWarnings("FieldCanBeLocal") //Useful when the features of different format versions are implemented
private int majorVersion;
/**
* Minor version of the property list format
*/
@SuppressWarnings("FieldCanBeLocal") //Useful when the features of different format versions are implemented
private int minorVersion;
/**
* property list in bytes
*/
private byte[] bytes;
/**
* Length of an object reference in bytes
*/
private int objectRefSize;
/**
* The table holding the information at which offset each object is found
*/
private int[] offsetTable;
/**
* Protected constructor so that instantiation is fully controlled by the
* static parse methods.
*
* @see BinaryPropertyListParser#parse(byte[])
*/
private BinaryPropertyListParser() {
/** empty **/
}
/**
* Parses a binary property list from a byte array.
*
* @param data The binary property list's data.
* @return The root object of the property list. This is usually a NSDictionary but can also be a NSArray.
* @throws PropertyListFormatException When the property list's format could not be parsed.
* @throws java.io.UnsupportedEncodingException When a NSString object could not be decoded.
*/
public static NSObject parse(byte[] data) throws PropertyListFormatException, UnsupportedEncodingException {
BinaryPropertyListParser parser = new BinaryPropertyListParser();
return parser.doParse(data);
}
/**
* Parses a binary property list from a byte array.
*
* @param data The binary property list's data.
* @return The root object of the property list. This is usually a NSDictionary but can also be a NSArray.
* @throws PropertyListFormatException When the property list's format could not be parsed.
* @throws java.io.UnsupportedEncodingException When a NSString object could not be decoded.
*/
private NSObject doParse(byte[] data) throws PropertyListFormatException, UnsupportedEncodingException {
bytes = data;
String magic = new String(copyOfRange(bytes, 0, 8));
if (!magic.startsWith("bplist")) {
throw new IllegalArgumentException("The given data is no binary property list. Wrong magic bytes: " + magic);
}
majorVersion = magic.charAt(6) - 0x30; //ASCII number
minorVersion = magic.charAt(7) - 0x30; //ASCII number
// 0.0 - OS X Tiger and earlier
// 0.1 - Leopard
// 0.? - Snow Leopard
// 1.5 - Lion
// 2.0 - Snow Lion
if (majorVersion > 0) {
throw new IllegalArgumentException("Unsupported binary property list format: v" + majorVersion + "." + minorVersion + ". " +
"Version 1.0 and later are not yet supported.");
//Version 1.0+ is not even supported by OS X's own parser
}
/*
* Handle trailer, last 32 bytes of the file
*/
byte[] trailer = copyOfRange(bytes, bytes.length - 32, bytes.length);
//6 null bytes (index 0 to 5)
int offsetSize = (int) parseUnsignedInt(trailer, 6, 7);
objectRefSize = (int) parseUnsignedInt(trailer, 7, 8);
int numObjects = (int) parseUnsignedInt(trailer, 8, 16);
int topObject = (int) parseUnsignedInt(trailer, 16, 24);
int offsetTableOffset = (int) parseUnsignedInt(trailer, 24, 32);
/*
* Handle offset table
*/
offsetTable = new int[numObjects];
for (int i = 0; i < numObjects; i++) {
offsetTable[i] = (int) parseUnsignedInt(bytes, offsetTableOffset + i * offsetSize, offsetTableOffset + (i + 1) * offsetSize);
}
return parseObject(topObject);
}
/**
* Parses a binary property list from an input stream.
*
* @param is The input stream that points to the property list's data.
* @return The root object of the property list. This is usually a NSDictionary but can also be a NSArray.
* @throws PropertyListFormatException When the property list's format could not be parsed.
* @throws java.io.IOException When a NSString object could not be decoded or an InputStream IO error occurs.
*/
public static NSObject parse(InputStream is) throws IOException, PropertyListFormatException {
byte[] buf = PropertyListParser.readAll(is);
return parse(buf);
}
/**
* Parses a binary property list file.
*
* @param f The binary property list file
* @return The root object of the property list. This is usually a NSDictionary but can also be a NSArray.
* @throws PropertyListFormatException When the property list's format could not be parsed.
* @throws java.io.UnsupportedEncodingException When a NSString object could not be decoded or a file IO error occurs.
*/
public static NSObject parse(File f) throws IOException, PropertyListFormatException {
return parse(new FileInputStream(f));
}
/**
* Parses an object inside the currently parsed binary property list.
* For the format specification check
*
* Apple's binary property list parser implementation.
*
* @param obj The object ID.
* @return The parsed object.
* @throws PropertyListFormatException When the property list's format could not be parsed.
* @throws java.io.UnsupportedEncodingException When a NSString object could not be decoded.
*/
private NSObject parseObject(int obj) throws PropertyListFormatException, UnsupportedEncodingException {
int offset = offsetTable[obj];
byte type = bytes[offset];
int objType = (type & 0xF0) >> 4; //First 4 bits
int objInfo = type & 0x0F; //Second 4 bits
switch (objType) {
case 0x0: {
//Simple
switch (objInfo) {
case 0x0: {
//null object (v1.0 and later)
return null;
}
case 0x8: {
//false
return new NSNumber(false);
}
case 0x9: {
//true
return new NSNumber(true);
}
case 0xC: {
//URL with no base URL (v1.0 and later)
//TODO Implement binary URL parsing (not yet even implemented in Core Foundation as of revision 855.17)
throw new UnsupportedOperationException("The given binary property list contains a URL object. Parsing of this object type is not yet implemented.");
}
case 0xD: {
//URL with base URL (v1.0 and later)
//TODO Implement binary URL parsing (not yet even implemented in Core Foundation as of revision 855.17)
throw new UnsupportedOperationException("The given binary property list contains a URL object. Parsing of this object type is not yet implemented.");
}
case 0xE: {
//16-byte UUID (v1.0 and later)
//TODO Implement binary UUID parsing (not yet even implemented in Core Foundation as of revision 855.17)
throw new UnsupportedOperationException("The given binary property list contains a UUID object. Parsing of this object type is not yet implemented.");
}
default: {
throw new PropertyListFormatException("The given binary property list contains an object of unknown type (" + objType + ")");
}
}
}
case 0x1: {
//integer
int length = (int) Math.pow(2, objInfo);
return new NSNumber(bytes, offset + 1, offset + 1 + length, NSNumber.INTEGER);
}
case 0x2: {
//real
int length = (int) Math.pow(2, objInfo);
return new NSNumber(bytes, offset + 1, offset + 1 + length, NSNumber.REAL);
}
case 0x3: {
//Date
if (objInfo != 0x3) {
throw new PropertyListFormatException("The given binary property list contains a date object of an unknown type ("+objInfo+")");
}
return new NSDate(bytes, offset + 1, offset + 9);
}
case 0x4: {
//Data
int[] lengthAndOffset = readLengthAndOffset(objInfo, offset);
int length = lengthAndOffset[0];
int dataOffset = lengthAndOffset[1];
return new NSData(copyOfRange(bytes, offset + dataOffset, offset + dataOffset + length));
}
case 0x5: {
//ASCII string
int[] lengthAndOffset = readLengthAndOffset(objInfo, offset);
int length = lengthAndOffset[0]; //Each character is 1 byte
int strOffset = lengthAndOffset[1];
return new NSString(bytes, offset + strOffset, offset + strOffset + length, "ASCII");
}
case 0x6: {
//UTF-16-BE string
int[] lengthAndOffset = readLengthAndOffset(objInfo, offset);
int characters = lengthAndOffset[0];
int strOffset = lengthAndOffset[1];
//UTF-16 characters can have variable length, but the Core Foundation reference implementation
//assumes 2 byte characters, thus only covering the Basic Multilingual Plane
int length = characters * 2;
return new NSString(bytes, offset + strOffset, offset + strOffset + length, "UTF-16BE");
}
case 0x7: {
//UTF-8 string (v1.0 and later)
int[] lengthAndOffset = readLengthAndOffset(objInfo, offset);
int strOffset = lengthAndOffset[1];
int characters = lengthAndOffset[0];
//UTF-8 characters can have variable length, so we need to calculate the byte length dynamically
//by reading the UTF-8 characters one by one
int length = calculateUtf8StringLength(bytes, offset + strOffset, characters);
return new NSString(bytes, offset + strOffset, offset + strOffset + length, "UTF-8");
}
case 0x8: {
//UID (v1.0 and later)
int length = objInfo + 1;
return new UID(String.valueOf(obj), copyOfRange(bytes, offset + 1, offset + 1 + length));
}
case 0xA: {
//Array
int[] lengthAndOffset = readLengthAndOffset(objInfo, offset);
int length = lengthAndOffset[0];
int arrayOffset = lengthAndOffset[1];
NSArray array = new NSArray(length);
for (int i = 0; i < length; i++) {
int objRef = (int) parseUnsignedInt(bytes, offset + arrayOffset + i * objectRefSize, offset + arrayOffset + (i + 1) * objectRefSize);
array.setValue(i, parseObject(objRef));
}
return array;
}
case 0xB: {
//Ordered set (v1.0 and later)
int[] lengthAndOffset = readLengthAndOffset(objInfo, offset);
int length = lengthAndOffset[0];
int contentOffset = lengthAndOffset[1];
NSSet set = new NSSet(true);
for (int i = 0; i < length; i++) {
int objRef = (int) parseUnsignedInt(bytes, offset + contentOffset + i * objectRefSize, offset + contentOffset + (i + 1) * objectRefSize);
set.addObject(parseObject(objRef));
}
return set;
}
case 0xC: {
//Set (v1.0 and later)
int[] lengthAndOffset = readLengthAndOffset(objInfo, offset);
int length = lengthAndOffset[0];
int contentOffset = lengthAndOffset[1];
NSSet set = new NSSet();
for (int i = 0; i < length; i++) {
int objRef = (int) parseUnsignedInt(bytes, offset + contentOffset + i * objectRefSize, offset + contentOffset + (i + 1) * objectRefSize);
set.addObject(parseObject(objRef));
}
return set;
}
case 0xD: {
//Dictionary
int[] lengthAndOffset = readLengthAndOffset(objInfo, offset);
int length = lengthAndOffset[0];
int contentOffset = lengthAndOffset[1];
NSDictionary dict = new NSDictionary();
for (int i = 0; i < length; i++) {
int keyRef = (int) parseUnsignedInt(bytes, offset + contentOffset + i * objectRefSize, offset + contentOffset + (i + 1) * objectRefSize);
int valRef = (int) parseUnsignedInt(bytes, offset + contentOffset + (length * objectRefSize) + i * objectRefSize, offset + contentOffset + (length * objectRefSize) + (i + 1) * objectRefSize);
NSObject key = parseObject(keyRef);
NSObject val = parseObject(valRef);
assert key != null; //Encountering a null object at this point would either be a fundamental error in the parser or an error in the property list
dict.put(key.toString(), val);
}
return dict;
}
default: {
throw new PropertyListFormatException("The given binary property list contains an object of unknown type (" + objType + ")");
}
}
}
/**
* Reads the length for arrays, sets and dictionaries.
*
* @param objInfo Object information byte.
* @param offset Offset in the byte array at which the object is located.
* @return An array with the length two. First entry is the length, second entry the offset at which the content starts.
*/
private int[] readLengthAndOffset(int objInfo, int offset) {
int lengthValue = objInfo;
int offsetValue = 1;
if (objInfo == 0xF) {
int int_type = bytes[offset + 1];
int intType = (int_type & 0xF0) >> 4;
if (intType != 0x1) {
System.err.println("BinaryPropertyListParser: Length integer has an unexpected type" + intType + ". Attempting to parse anyway...");
}
int intInfo = int_type & 0x0F;
int intLength = (int) Math.pow(2, intInfo);
offsetValue = 2 + intLength;
if (intLength < 3) {
lengthValue = (int) parseUnsignedInt(bytes, offset + 2, offset + 2 + intLength);
} else {
lengthValue = new BigInteger(copyOfRange(bytes, offset + 2, offset + 2 + intLength)).intValue();
}
}
return new int[]{lengthValue, offsetValue};
}
private int calculateUtf8StringLength(byte[] bytes, int offset, int numCharacters) {
int length = 0;
for(int i = 0; i < numCharacters; i++) {
int tempOffset = offset + length;
if(bytes.length <= tempOffset) {
//WARNING: Invalid UTF-8 string, fall back to length = number of characters
return numCharacters;
}
if(bytes[tempOffset] < 0x80) {
length++;
}
if(bytes[tempOffset] < 0xC2) {
//Invalid value (marks continuation byte), fall back to length = number of characters
return numCharacters;
}
else if(bytes[tempOffset] < 0xE0) {
if((bytes[tempOffset + 1] & 0xC0) != 0x80) {
//Invalid continuation byte, fall back to length = number of characters
return numCharacters;
}
length += 2;
}
else if(bytes[tempOffset] < 0xF0) {
if((bytes[tempOffset + 1] & 0xC0) != 0x80
|| (bytes[tempOffset + 2] & 0xC0) != 0x80) {
//Invalid continuation byte, fall back to length = number of characters
return numCharacters;
}
length += 3;
}
else if(bytes[tempOffset] < 0xF5) {
if((bytes[tempOffset + 1] & 0xC0) != 0x80
|| (bytes[tempOffset + 2] & 0xC0) != 0x80
|| (bytes[tempOffset + 3] & 0xC0) != 0x80) {
//Invalid continuation byte, fall back to length = number of characters
return numCharacters;
}
length += 4;
}
}
return length;
}
/**
* Parses an unsigned integers from a byte array.
*
* @param bytes The byte array containing the unsigned integer.
* @return The unsigned integer represented by the given bytes.
*/
@SuppressWarnings("unused")
public static long parseUnsignedInt(byte[] bytes) {
return parseUnsignedInt(bytes, 0, bytes.length);
}
/**
* Parses an unsigned integer from a byte array.
*
* @param bytes The byte array containing the unsigned integer.
* @param startIndex Beginning of the unsigned int in the byte array.
* @param endIndex End of the unsigned int in the byte array.
* @return The unsigned integer represented by the given bytes.
*/
public static long parseUnsignedInt(byte[] bytes, int startIndex, int endIndex) {
long l = 0;
for (int i = startIndex; i < endIndex; i++) {
l <<= 8;
l |= bytes[i] & 0xFF;
}
l &= 0xFFFFFFFFL;
return l;
}
/**
* Parses a long from a (big-endian) byte array.
*
* @param bytes The bytes representing the long integer.
* @return The long integer represented by the given bytes.
*/
@SuppressWarnings("unused")
public static long parseLong(byte[] bytes) {
return parseLong(bytes, 0, bytes.length);
}
/**
* Parses a long from a (big-endian) byte array.
*
* @param bytes The bytes representing the long integer.
* @param startIndex Beginning of the long in the byte array.
* @param endIndex End of the long in the byte array.
* @return The long integer represented by the given bytes.
*/
public static long parseLong(byte[] bytes, int startIndex, int endIndex) {
long l = 0;
for (int i = startIndex; i < endIndex; i++) {
l <<= 8;
l |= bytes[i] & 0xFF;
}
return l;
}
/**
* Parses a double from a (big-endian) byte array.
*
* @param bytes The bytes representing the double.
* @return The double represented by the given bytes.
*/
@SuppressWarnings("unused")
public static double parseDouble(byte[] bytes) {
return parseDouble(bytes, 0, bytes.length);
}
/**
* Parses a double from a (big-endian) byte array.
*
* @param bytes The bytes representing the double.
* @param startIndex Beginning of the double in the byte array.
* @param endIndex End of the double in the byte array.
* @return The double represented by the given bytes.
*/
public static double parseDouble(byte[] bytes, int startIndex, int endIndex) {
if (endIndex - startIndex == 8) {
return Double.longBitsToDouble(parseLong(bytes, startIndex, endIndex));
} else if (endIndex - startIndex == 4) {
return Float.intBitsToFloat((int)parseLong(bytes, startIndex, endIndex));
} else {
throw new IllegalArgumentException("endIndex ("+endIndex+") - startIndex ("+startIndex+") != 4 or 8");
}
}
/**
* Copies a part of a byte array into a new array.
*
* @param src The source array.
* @param startIndex The index from which to start copying.
* @param endIndex The index until which to copy.
* @return The copied array.
*/
public static byte[] copyOfRange(byte[] src, int startIndex, int endIndex) {
int length = endIndex - startIndex;
if (length < 0) {
throw new IllegalArgumentException("startIndex (" + startIndex + ")" + " > endIndex (" + endIndex + ")");
}
byte[] dest = new byte[length];
System.arraycopy(src, startIndex, dest, 0, length);
return dest;
}
}