All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.jpedal.parser.image.ID Maven / Gradle / Ivy

There is a newer version: 7.15.25
Show newest version
/*
 * ===========================================
 * Java Pdf Extraction Decoding Access Library
 * ===========================================
 *
 * Project Info:  http://www.idrsolutions.com
 * Help section for developers at http://www.idrsolutions.com/support/
 *
 * (C) Copyright 1997-2017 IDRsolutions and Contributors.
 *
 * This file is part of JPedal/JPDF2HTML5
 *
 @LICENSE@
 *
 * ---------------
 * ID.java
 * ---------------
 */
package org.jpedal.parser.image;

import java.awt.Color;
import java.awt.image.BufferedImage;

import org.jpedal.color.ColorspaceFactory;
import org.jpedal.color.DeviceRGBColorSpace;
import org.jpedal.color.GenericColorSpace;
import org.jpedal.exception.PdfException;
import org.jpedal.external.ErrorTracker;
import org.jpedal.external.ImageHandler;
import org.jpedal.io.*;
import org.jpedal.objects.PdfImageData;
import org.jpedal.objects.PdfPageData;
import org.jpedal.objects.raw.PdfArrayIterator;
import org.jpedal.objects.raw.PdfDictionary;
import org.jpedal.objects.raw.PdfObject;
import org.jpedal.parser.PdfObjectCache;
import org.jpedal.parser.image.data.ImageData;

public class ID extends ImageDecoder {
    public ID(final int imageCount, final PdfObjectReader currentPdfFile, final ErrorTracker errorTracker, final ImageHandler customImageHandler, final ObjectStore objectStoreStreamRef, final PdfImageData pdfImages, final PdfPageData pageData, final String imagesInFile) {
        super(imageCount, currentPdfFile, errorTracker, customImageHandler, objectStoreStreamRef, pdfImages, pageData, imagesInFile);
    }

    @Override
    public int processImage(int dataPointer, final int startInlineStream, final byte[] stream, final int tokenNumber) throws Exception {

        final PdfObject XObject = convertDataToObject(dataPointer, startInlineStream, stream, currentPdfFile.getObjectReader());

        final boolean inline_imageMask = XObject.getBoolean(PdfDictionary.ImageMask);
        final int inline_start_pointer = dataPointer + 1;
        final int i_w = XObject.getInt(PdfDictionary.Width);
        final int i_h = XObject.getInt(PdfDictionary.Height);
        final int i_bpc = XObject.getInt(PdfDictionary.BitsPerComponent);

        //find end of stream
        final int i = getEndOfImageData(inline_start_pointer, stream);

        if (parserOptions.imagesNeeded()) {

            BufferedImage image = null;

            final String image_name = parserOptions.getFileName() + "-IN-" + tokenNumber;

            byte[] i_data = setImageData(i, stream, inline_start_pointer, XObject);

            // allow user to process image
            if (customImageHandler != null) {
                image = customImageHandler.processImageData(gs, XObject);
            }

            i_data = decompressData(XObject, i_data, i_w, i_h);

            final GenericColorSpace decodeColorData = setColorSpace(XObject, currentPdfFile, cache);

            decodeColorData.setPrinting(parserOptions.isPrinting());

            //track colorspace use
            cache.put(PdfObjectCache.ColorspacesUsed, decodeColorData.getID(), "x");

            if (i_data != null) {

                if (customImageHandler == null || (image == null && !customImageHandler.alwaysIgnoreGenericHandler())) {
                    image = convertDataToImage(i_w, i_h, i_bpc, i_data, decodeColorData, image, inline_imageMask, XObject, image_name);
                }

                if (image != null) {
                    renderImage(image, image_name);
                }
            }
        }

        dataPointer = i + 3;

        return dataPointer;

    }

    private void renderImage(final BufferedImage image, final String image_name) {

        if (current.isHTMLorSVG()) {
            current.drawImage(parserOptions.getPageNumber(), image, gs, false, image_name, -2);

        } else {

            gs.x = gs.CTM[2][0];
            gs.y = gs.CTM[2][1];

            current.drawImage(parserOptions.getPageNumber(), image, gs, false, image_name, -1);
        }

        if (image != null) {
            image.flush();
        }
    }

    private BufferedImage convertDataToImage(final int i_w, final int i_h, final int i_bpc, final byte[] i_data, final GenericColorSpace decodeColorData, BufferedImage image, final boolean inline_imageMask, final PdfObject XObject, final String image_name) throws PdfException {
        final ImageData imageData = new ImageData(ImageCommands.ID);
        imageData.setWidth(i_w);
        imageData.setHeight(i_h);
        imageData.setDepth(i_bpc);
        imageData.setObjectData(i_data);
        imageData.setCompCount(decodeColorData.getColorSpace().getNumComponents());
        image = processImage(decodeColorData, imageData, inline_imageMask, XObject);
        //transparency slows down printing so try to reduce if possible in printing
        if (inline_imageMask && !ImageDecoder.allowPrintTransparency && parserOptions.isPrinting() && image != null && imageData.getDepth() == 1) {
            image = setupMask(image);
        }
        //generate name including filename to make it unique
        currentImage = image_name;
        return image;
    }

    private static GenericColorSpace setColorSpace(final PdfObject XObject, final PdfObjectReader currentPdfFile, final PdfObjectCache cache) {

        //handle colour information
        GenericColorSpace decodeColorData = new DeviceRGBColorSpace();
        //resolve color details
        PdfArrayIterator ColorSpace = XObject.getMixedArray(PdfDictionary.ColorSpace);
        if (ColorSpace.getTokenCount() > 0) { //if not set will be zero

            //allow for lookup
            final String colKey = ColorSpace.getNextValueAsString(false);

            if (colKey != null) { //allow for /R188 stored in lookup
                final Object col = cache.get(PdfObjectCache.Colorspaces, colKey.substring(1));

                if (col != null) {
                    ColorSpace = ColorspaceFactory.convertColValueToMixedArray(currentPdfFile, (byte[]) col);
                }
            }

            decodeColorData = ColorspaceFactory.getColorSpaceInstance(currentPdfFile, ColorSpace);
        }

        return decodeColorData;
    }

    private static PdfObject convertDataToObject(final int dataPointer, final int startInlineStream, final byte[] stream, final PdfFileReader pdfFileReader) {

        final PdfObject XObject = new org.jpedal.objects.raw.XObject(PdfDictionary.ID);
        final IDObjectDecoder objectDecoder = new IDObjectDecoder(pdfFileReader);

        objectDecoder.setEndPt(dataPointer - 2);
        objectDecoder.readDictionaryAsObject(XObject, startInlineStream, stream);

        return XObject;
    }

    private BufferedImage setupMask(BufferedImage image) {
        //setup any imageMask
        final byte[] maskCol = ImageCommands.getMaskColor(gs);
        if (maskCol != null && maskCol[0] == 0 && maskCol[1] == 0 && maskCol[2] == 0 && maskCol[3] == 0) {
            final int iw = image.getWidth();
            final int ih = image.getHeight();
            final BufferedImage newImage = new BufferedImage(iw, ih, BufferedImage.TYPE_BYTE_GRAY);

            newImage.getGraphics().setColor(Color.WHITE);
            newImage.getGraphics().fillRect(0, 0, iw, ih);
            newImage.getGraphics().drawImage(image, 0, 0, null);
            image = newImage;
        }
        return image;
    }

    private byte[] decompressData(final PdfObject XObject, byte[] i_data, final int i_w, final int i_h) throws Exception {
        final PdfArrayIterator filters = XObject.getMixedArray(PdfDictionary.Filter);
        //check not handled elsewhere
        final int firstValue;
        boolean needsDecoding = false;
        if (filters != null && filters.hasMoreTokens()) {
            firstValue = filters.getNextValueAsConstant(false);

            needsDecoding = (firstValue != PdfFilteredReader.JPXDecode && firstValue != PdfFilteredReader.DCTDecode);
        }
        //handle filters (JPXDecode/DCT decode is handle by process image)
        if (needsDecoding) {
            final PdfFilteredReader filter = new PdfFilteredReader();
            i_data = filter.decodeFilters(ObjectUtils.setupDecodeParms(XObject, currentPdfFile.getObjectReader()), i_data, filters, i_w, i_h, null);
        }
        return i_data;
    }

    private static byte[] setImageData(final int i, final byte[] stream, int inline_start_pointer, final PdfObject XObject) {

        int endPtr = i;

        //hack for odd files
        if (i < stream.length && stream[endPtr] != 32 && stream[endPtr] != 10 && stream[endPtr] != 13) {
            endPtr++;
        }
        //correct data (ie idoq/FC1100000021259.pdf )
        if (stream[inline_start_pointer] == 10) {
            inline_start_pointer++;
        }
        /*
        * put image data in array
        */
        final byte[] i_data = new byte[endPtr - inline_start_pointer];
        System.arraycopy(
                stream,
                inline_start_pointer,
                i_data,
                0,
                endPtr - inline_start_pointer);
        XObject.setStream(i_data);

        return i_data;
    }

    private static int getEndOfImageData(int i, final byte[] stream) {

        final int streamLength = stream.length;

        //find end
        while (true) {
            //look for end EI

            //handle Pdflib and xenos variety
            if (streamLength - i > 3 && stream[i + 1] == 69 && stream[i + 2] == 73 && ((stream[i + 3] == 10 && (streamLength == i + 4 || stream[i + 4] == 81)) || (stream[i + 3] == 32 && stream[i + 4] == 10))) {
                break;
            }

            //handle RADPDF  variety (see 26654)
            if (streamLength - i > 3 && stream[i + 1] == 69 && stream[i + 2] == 73 && ((stream[i + 3] == 32 && stream[i + 4] == 32))) {
                break;
            }

            //general case
            if ((streamLength - i > 3) && (stream[i] == 32 || stream[i] == 10 || stream[i] == 13 || (stream[i + 3] == 32 && stream[i + 4] == 'Q'))
                    && (stream[i + 1] == 69)
                    && (stream[i + 2] == 73)
                    && (stream[i + 3] == 32 || stream[i + 3] == 10 || stream[i + 3] == 13)) {
                break;
            }


            i++;

            if (i == streamLength) {
                break;
            }
        }
        return i;
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy