org.apache.commons.imaging.formats.tiff.TiffReader Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of commons-imaging Show documentation
Show all versions of commons-imaging Show documentation
Apache Commons Imaging (previously Sanselan) is a pure-Java image library.
The newest version!
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.commons.imaging.formats.tiff;
import static org.apache.commons.imaging.common.BinaryFunctions.read2Bytes;
import static org.apache.commons.imaging.common.BinaryFunctions.read4Bytes;
import static org.apache.commons.imaging.common.BinaryFunctions.readByte;
import static org.apache.commons.imaging.common.BinaryFunctions.readBytes;
import static org.apache.commons.imaging.common.BinaryFunctions.skipBytes;
import static org.apache.commons.imaging.formats.tiff.constants.TiffConstants.TIFF_ENTRY_MAX_VALUE_LENGTH;
import java.io.IOException;
import java.io.InputStream;
import java.nio.ByteOrder;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;
import org.apache.commons.imaging.FormatCompliance;
import org.apache.commons.imaging.ImageReadException;
import org.apache.commons.imaging.ImagingConstants;
import org.apache.commons.imaging.common.BinaryFileParser;
import org.apache.commons.imaging.common.ByteConversions;
import org.apache.commons.imaging.common.bytesource.ByteSource;
import org.apache.commons.imaging.common.bytesource.ByteSourceFile;
import org.apache.commons.imaging.formats.jpeg.JpegConstants;
import org.apache.commons.imaging.formats.tiff.TiffDirectory.ImageDataElement;
import org.apache.commons.imaging.formats.tiff.constants.ExifTagConstants;
import org.apache.commons.imaging.formats.tiff.constants.TiffDirectoryConstants;
import org.apache.commons.imaging.formats.tiff.constants.TiffTagConstants;
import org.apache.commons.imaging.formats.tiff.fieldtypes.FieldType;
import org.apache.commons.imaging.formats.tiff.taginfos.TagInfoDirectory;
public class TiffReader extends BinaryFileParser {
private final boolean strict;
public TiffReader(final boolean strict) {
this.strict = strict;
}
private TiffHeader readTiffHeader(final ByteSource byteSource) throws ImageReadException, IOException {
try (InputStream is = byteSource.getInputStream()) {
return readTiffHeader(is);
}
}
private ByteOrder getTiffByteOrder(final int byteOrderByte) throws ImageReadException {
if (byteOrderByte == 'I') {
return ByteOrder.LITTLE_ENDIAN; // Intel
} else if (byteOrderByte == 'M') {
return ByteOrder.BIG_ENDIAN; // Motorola
} else {
throw new ImageReadException("Invalid TIFF byte order " + (0xff & byteOrderByte));
}
}
private TiffHeader readTiffHeader(final InputStream is) throws ImageReadException, IOException {
final int byteOrder1 = readByte("BYTE_ORDER_1", is, "Not a Valid TIFF File");
final int byteOrder2 = readByte("BYTE_ORDER_2", is, "Not a Valid TIFF File");
if (byteOrder1 != byteOrder2) {
throw new ImageReadException("Byte Order bytes don't match (" + byteOrder1 + ", " + byteOrder2 + ").");
}
final ByteOrder byteOrder = getTiffByteOrder(byteOrder1);
setByteOrder(byteOrder);
final int tiffVersion = read2Bytes("tiffVersion", is, "Not a Valid TIFF File", getByteOrder());
if (tiffVersion != 42) {
throw new ImageReadException("Unknown Tiff Version: " + tiffVersion);
}
final long offsetToFirstIFD =
0xFFFFffffL & read4Bytes("offsetToFirstIFD", is, "Not a Valid TIFF File", getByteOrder());
skipBytes(is, offsetToFirstIFD - 8, "Not a Valid TIFF File: couldn't find IFDs");
if (getDebug()) {
System.out.println("");
}
return new TiffHeader(byteOrder, tiffVersion, offsetToFirstIFD);
}
private void readDirectories(final ByteSource byteSource,
final FormatCompliance formatCompliance, final Listener listener)
throws ImageReadException, IOException {
final TiffHeader tiffHeader = readTiffHeader(byteSource);
if (!listener.setTiffHeader(tiffHeader)) {
return;
}
final long offset = tiffHeader.offsetToFirstIFD;
final int dirType = TiffDirectoryConstants.DIRECTORY_TYPE_ROOT;
final List visited = new ArrayList<>();
readDirectory(byteSource, offset, dirType, formatCompliance, listener, visited);
}
private boolean readDirectory(final ByteSource byteSource, final long offset,
final int dirType, final FormatCompliance formatCompliance, final Listener listener,
final List visited) throws ImageReadException, IOException {
final boolean ignoreNextDirectory = false;
return readDirectory(byteSource, offset, dirType, formatCompliance,
listener, ignoreNextDirectory, visited);
}
private boolean readDirectory(final ByteSource byteSource, final long directoryOffset,
final int dirType, final FormatCompliance formatCompliance, final Listener listener,
final boolean ignoreNextDirectory, final List visited)
throws ImageReadException, IOException {
if (visited.contains(directoryOffset)) {
return false;
}
visited.add(directoryOffset);
try (InputStream is = byteSource.getInputStream()) {
if (directoryOffset >= byteSource.getLength()) {
return true;
}
skipBytes(is, directoryOffset);
final List fields = new ArrayList<>();
int entryCount;
try {
entryCount = read2Bytes("DirectoryEntryCount", is, "Not a Valid TIFF File", getByteOrder());
} catch (final IOException e) {
if (strict) {
throw e;
}
return true;
}
for (int i = 0; i < entryCount; i++) {
final int tag = read2Bytes("Tag", is, "Not a Valid TIFF File", getByteOrder());
final int type = read2Bytes("Type", is, "Not a Valid TIFF File", getByteOrder());
final long count = 0xFFFFffffL & read4Bytes("Count", is, "Not a Valid TIFF File", getByteOrder());
final byte[] offsetBytes = readBytes("Offset", is, 4, "Not a Valid TIFF File");
final long offset = 0xFFFFffffL & ByteConversions.toInt(offsetBytes, getByteOrder());
if (tag == 0) {
// skip invalid fields.
// These are seen very rarely, but can have invalid value
// lengths,
// which can cause OOM problems.
continue;
}
final FieldType fieldType;
try {
fieldType = FieldType.getFieldType(type);
} catch (final ImageReadException imageReadEx) {
// skip over unknown fields types, since we
// can't calculate their size without
// knowing their type
continue;
}
final long valueLength = count * fieldType.getSize();
final byte[] value;
if (valueLength > TIFF_ENTRY_MAX_VALUE_LENGTH) {
if ((offset < 0) || (offset + valueLength) > byteSource.getLength()) {
if (strict) {
throw new IOException(
"Attempt to read byte range starting from " + offset + " "
+ "of length " + valueLength + " "
+ "which is outside the file's size of "
+ byteSource.getLength());
} else {
// corrupt field, ignore it
continue;
}
}
value = byteSource.getBlock(offset, (int) valueLength);
} else {
value = offsetBytes;
}
final TiffField field = new TiffField(tag, dirType, fieldType, count,
offset, value, getByteOrder(), i);
fields.add(field);
if (!listener.addField(field)) {
return true;
}
}
final long nextDirectoryOffset = 0xFFFFffffL & read4Bytes("nextDirectoryOffset", is,
"Not a Valid TIFF File", getByteOrder());
final TiffDirectory directory = new TiffDirectory(dirType, fields,
directoryOffset, nextDirectoryOffset);
if (listener.readImageData()) {
if (directory.hasTiffImageData()) {
final TiffImageData rawImageData = getTiffRawImageData(
byteSource, directory);
directory.setTiffImageData(rawImageData);
}
if (directory.hasJpegImageData()) {
final JpegImageData rawJpegImageData = getJpegRawImageData(
byteSource, directory);
directory.setJpegImageData(rawJpegImageData);
}
}
if (!listener.addDirectory(directory)) {
return true;
}
if (listener.readOffsetDirectories()) {
final TagInfoDirectory[] offsetFields = {
ExifTagConstants.EXIF_TAG_EXIF_OFFSET,
ExifTagConstants.EXIF_TAG_GPSINFO,
ExifTagConstants.EXIF_TAG_INTEROP_OFFSET
};
final int[] directoryTypes = {
TiffDirectoryConstants.DIRECTORY_TYPE_EXIF,
TiffDirectoryConstants.DIRECTORY_TYPE_GPS,
TiffDirectoryConstants.DIRECTORY_TYPE_INTEROPERABILITY
};
for (int i = 0; i < offsetFields.length; i++) {
final TagInfoDirectory offsetField = offsetFields[i];
final TiffField field = directory.findField(offsetField);
if (field != null) {
long subDirectoryOffset;
int subDirectoryType;
boolean subDirectoryRead = false;
try {
subDirectoryOffset = directory.getFieldValue(offsetField);
subDirectoryType = directoryTypes[i];
subDirectoryRead = readDirectory(byteSource,
subDirectoryOffset, subDirectoryType,
formatCompliance, listener, true, visited);
} catch (final ImageReadException imageReadException) {
if (strict) {
throw imageReadException;
}
}
if (!subDirectoryRead) {
fields.remove(field);
}
}
}
}
if (!ignoreNextDirectory && directory.nextDirectoryOffset > 0) {
// Debug.debug("next dir", directory.nextDirectoryOffset );
readDirectory(byteSource, directory.nextDirectoryOffset,
dirType + 1, formatCompliance, listener, visited);
}
return true;
}
}
public interface Listener {
boolean setTiffHeader(TiffHeader tiffHeader);
boolean addDirectory(TiffDirectory directory);
boolean addField(TiffField field);
boolean readImageData();
boolean readOffsetDirectories();
}
private static class Collector implements Listener {
private TiffHeader tiffHeader;
private final List directories = new ArrayList<>();
private final List fields = new ArrayList<>();
private final boolean readThumbnails;
public Collector() {
this(null);
}
public Collector(final Map params) {
boolean tmpReadThumbnails = true;
if (params != null && params.containsKey(ImagingConstants.PARAM_KEY_READ_THUMBNAILS)) {
tmpReadThumbnails = Boolean.TRUE.equals(params.get(ImagingConstants.PARAM_KEY_READ_THUMBNAILS));
}
this.readThumbnails = tmpReadThumbnails;
}
@Override
public boolean setTiffHeader(final TiffHeader tiffHeader) {
this.tiffHeader = tiffHeader;
return true;
}
@Override
public boolean addDirectory(final TiffDirectory directory) {
directories.add(directory);
return true;
}
@Override
public boolean addField(final TiffField field) {
fields.add(field);
return true;
}
@Override
public boolean readImageData() {
return readThumbnails;
}
@Override
public boolean readOffsetDirectories() {
return true;
}
public TiffContents getContents() {
return new TiffContents(tiffHeader, directories);
}
}
private static class FirstDirectoryCollector extends Collector {
private final boolean readImageData;
public FirstDirectoryCollector(final boolean readImageData) {
this.readImageData = readImageData;
}
@Override
public boolean addDirectory(final TiffDirectory directory) {
super.addDirectory(directory);
return false;
}
@Override
public boolean readImageData() {
return readImageData;
}
}
// NOT USED
// private static class DirectoryCollector extends Collector {
// private final boolean readImageData;
//
// public DirectoryCollector(final boolean readImageData) {
// this.readImageData = readImageData;
// }
//
// @Override
// public boolean addDirectory(final TiffDirectory directory) {
// super.addDirectory(directory);
// return false;
// }
//
// @Override
// public boolean readImageData() {
// return readImageData;
// }
// }
public TiffContents readFirstDirectory(final ByteSource byteSource, final Map params,
final boolean readImageData, final FormatCompliance formatCompliance)
throws ImageReadException, IOException {
final Collector collector = new FirstDirectoryCollector(readImageData);
read(byteSource, params, formatCompliance, collector);
final TiffContents contents = collector.getContents();
if (contents.directories.size() < 1) {
throw new ImageReadException(
"Image did not contain any directories.");
}
return contents;
}
public TiffContents readDirectories(final ByteSource byteSource,
final boolean readImageData, final FormatCompliance formatCompliance)
throws ImageReadException, IOException {
final Collector collector = new Collector(null);
readDirectories(byteSource, formatCompliance, collector);
final TiffContents contents = collector.getContents();
if (contents.directories.size() < 1) {
throw new ImageReadException(
"Image did not contain any directories.");
}
return contents;
}
public TiffContents readContents(final ByteSource byteSource, final Map params,
final FormatCompliance formatCompliance) throws ImageReadException,
IOException {
final Collector collector = new Collector(params);
read(byteSource, params, formatCompliance, collector);
return collector.getContents();
}
public void read(final ByteSource byteSource, final Map params,
final FormatCompliance formatCompliance, final Listener listener)
throws ImageReadException, IOException {
// TiffContents contents =
readDirectories(byteSource, formatCompliance, listener);
}
private TiffImageData getTiffRawImageData(final ByteSource byteSource,
final TiffDirectory directory) throws ImageReadException, IOException {
final List elements = directory.getTiffRawImageDataElements();
final TiffImageData.Data[] data = new TiffImageData.Data[elements.size()];
if (byteSource instanceof ByteSourceFile) {
final ByteSourceFile bsf = (ByteSourceFile) byteSource;
for (int i = 0; i < elements.size(); i++) {
final TiffDirectory.ImageDataElement element = elements.get(i);
data[i] = new TiffImageData.ByteSourceData(element.offset,
element.length, bsf);
}
} else {
for (int i = 0; i < elements.size(); i++) {
final TiffDirectory.ImageDataElement element = elements.get(i);
final byte[] bytes = byteSource.getBlock(element.offset, element.length);
data[i] = new TiffImageData.Data(element.offset, element.length, bytes);
}
}
if (directory.imageDataInStrips()) {
final TiffField rowsPerStripField = directory.findField(TiffTagConstants.TIFF_TAG_ROWS_PER_STRIP);
/*
* Default value of rowsperstrip is assumed to be infinity
* http://www.awaresystems.be/imaging/tiff/tifftags/rowsperstrip.html
*/
int rowsPerStrip = Integer.MAX_VALUE;
if (null != rowsPerStripField) {
rowsPerStrip = rowsPerStripField.getIntValue();
} else {
final TiffField imageHeight = directory.findField(TiffTagConstants.TIFF_TAG_IMAGE_LENGTH);
/**
* if rows per strip not present then rowsPerStrip is equal to
* imageLength or an infinity value;
*/
if (imageHeight != null) {
rowsPerStrip = imageHeight.getIntValue();
}
}
return new TiffImageData.Strips(data, rowsPerStrip);
} else {
final TiffField tileWidthField = directory.findField(TiffTagConstants.TIFF_TAG_TILE_WIDTH);
if (null == tileWidthField) {
throw new ImageReadException("Can't find tile width field.");
}
final int tileWidth = tileWidthField.getIntValue();
final TiffField tileLengthField = directory.findField(TiffTagConstants.TIFF_TAG_TILE_LENGTH);
if (null == tileLengthField) {
throw new ImageReadException("Can't find tile length field.");
}
final int tileLength = tileLengthField.getIntValue();
return new TiffImageData.Tiles(data, tileWidth, tileLength);
}
}
private JpegImageData getJpegRawImageData(final ByteSource byteSource,
final TiffDirectory directory) throws ImageReadException, IOException {
final ImageDataElement element = directory.getJpegRawImageDataElement();
final long offset = element.offset;
int length = element.length;
// In case the length is not correct, adjust it and check if the last read byte actually is the end of the image
if (offset + length > byteSource.getLength()) {
length = (int) (byteSource.getLength() - offset);
}
final byte[] data = byteSource.getBlock(offset, length);
// check if the last read byte is actually the end of the image data
if (strict &&
(length < 2 ||
(((data[data.length - 2] & 0xff) << 8) | (data[data.length - 1] & 0xff)) != JpegConstants.EOI_MARKER)) {
throw new ImageReadException("JPEG EOI marker could not be found at expected location");
}
return new JpegImageData(offset, length, data);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy