All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.jpedal.jbig2.segment.region.text.TextRegionSegment Maven / Gradle / Ivy

There is a newer version: 20151002
Show newest version
/**
* ===========================================
* Java Pdf Extraction Decoding Access Library
* ===========================================
*
* Project Info:  http://www.jpedal.org
* (C) Copyright 1997-2008, IDRsolutions and Contributors.
* Main Developer: Simon Barnett
*
* 	This file is part of JPedal
*
* Copyright (c) 2008, IDRsolutions
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*     * Redistributions of source code must retain the above copyright
*       notice, this list of conditions and the following disclaimer.
*     * Redistributions in binary form must reproduce the above copyright
*       notice, this list of conditions and the following disclaimer in the
*       documentation and/or other materials provided with the distribution.
*     * Neither the name of the IDRsolutions nor the
*       names of its contributors may be used to endorse or promote products
*       derived from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY IDRsolutions ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
* DISCLAIMED. IN NO EVENT SHALL IDRsolutions BE LIABLE FOR ANY
* DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
* Other JBIG2 image decoding implementations include
* jbig2dec (http://jbig2dec.sourceforge.net/)
* xpdf (http://www.foolabs.com/xpdf/)
* 
* The final draft JBIG2 specification can be found at http://www.jpeg.org/public/fcd14492.pdf
* 
* All three of the above resources were used in the writing of this software, with methodologies,
* processes and inspiration taken from all three.
*
* ---------------
* TextRegionSegment.java
* ---------------
*/
package org.jpedal.jbig2.segment.region.text;

import java.io.IOException;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;

import org.jpedal.jbig2.JBIG2Exception;
import org.jpedal.jbig2.decoders.HuffmanDecoder;
import org.jpedal.jbig2.decoders.JBIG2StreamDecoder;
import org.jpedal.jbig2.image.JBIG2Bitmap;
import org.jpedal.jbig2.segment.Segment;
import org.jpedal.jbig2.segment.pageinformation.PageInformationSegment;
import org.jpedal.jbig2.segment.region.RegionFlags;
import org.jpedal.jbig2.segment.region.RegionSegment;
import org.jpedal.jbig2.segment.symboldictionary.SymbolDictionarySegment;
import org.jpedal.jbig2.util.BinaryOperation;

/**
 * Text region segment of a JBIG2 stream.
 *
 * Reading the segment parses the text region flags (plus the optional Huffman
 * flags and refinement adaptive template values), gathers the symbol bitmaps
 * exported by the referred-to symbol dictionary segments, prepares either the
 * Huffman or the arithmetic decoder, and then asks a new {@link JBIG2Bitmap}
 * to decode the region. The resulting bitmap is either combined into the page
 * bitmap (inline image) or appended to the stream decoder.
 *
 * Limitation: Huffman table selectors that do not name one of the standard
 * tables (in the JBIG2 specification these denote a user-supplied table taken
 * from a referred-to code table segment) are not supported; the matching
 * table is passed to the bitmap decoder as <code>null</code>.
 */
public class TextRegionSegment extends RegionSegment {
	/** Flags decoded from the two byte text region flags field. */
	private final TextRegionFlags textRegionFlags = new TextRegionFlags();

	/** Huffman table selectors; only read from the stream when SB_HUFF is set. */
	private final TextRegionHuffmanFlags textRegionHuffmanFlags = new TextRegionHuffmanFlags();

	/** Value of the four byte field that follows the flags. */
	private int noOfSymbolInstances;

	/** true: combine the result into the page bitmap; false: append it to the decoder. */
	private final boolean inlineImage;

	/** Refinement adaptive template values; filled only when SB_REFINE is set and SB_R_TEMPLATE is 0. */
	private final short[] symbolRegionAdaptiveTemplateX = new short[2];
	private final short[] symbolRegionAdaptiveTemplateY = new short[2];

	/**
	 * @param streamDecoder decoder that owns the stream this segment is read from
	 * @param inlineImage whether the decoded region is combined directly into the page bitmap
	 */
	public TextRegionSegment(JBIG2StreamDecoder streamDecoder, boolean inlineImage) {
		super(streamDecoder);

		this.inlineImage = inlineImage;
	}

	/**
	 * Reads and decodes the complete text region segment.
	 *
	 * @throws IOException if the underlying stream fails, if a referred-to
	 *             segment cannot be found, or if the symbol code length data
	 *             starts with a "repeat previous length" run
	 * @throws JBIG2Exception propagated from the decoders
	 */
	public void readSegment() throws IOException, JBIG2Exception {
		if (JBIG2StreamDecoder.debug) {
			System.out.println("==== Reading Text Region ====");
		}

		super.readSegment();

		/** read text region Segment flags */
		readTextRegionFlags();

		short[] buff = new short[4];
		decoder.readByte(buff);
		noOfSymbolInstances = BinaryOperation.getInt32(buff);

		if (JBIG2StreamDecoder.debug) {
			System.out.println("noOfSymbolInstances = " + noOfSymbolInstances);
		}

		int noOfReferredToSegments = segmentHeader.getReferredToSegmentCount();
		int[] referredToSegments = segmentHeader.getReferredToSegments();

		if (JBIG2StreamDecoder.debug) {
			System.out.println("noOfReferredToSegments = " + noOfReferredToSegments);
		}

		/*
		 * Only symbol dictionaries are collected. Referred-to code table
		 * segments are ignored because custom Huffman tables are not
		 * supported by this class.
		 */
		List symbolDictionaries = new ArrayList();
		int noOfSymbols = 0;

		for (int i = 0; i < noOfReferredToSegments; i++) {
			Segment seg = decoder.findSegment(referredToSegments[i]);
			if (seg == null) {
				// NOTE(review): assumes findSegment signals "not found" with null - confirm.
				// Previously this case surfaced as a bare NullPointerException.
				throw new IOException("Invalid JBIG2 text region: referred-to segment " + referredToSegments[i] + " not found");
			}

			if (seg.getSegmentHeader().getSegmentType() == Segment.SYMBOL_DICTIONARY) {
				symbolDictionaries.add(seg);
				noOfSymbols += ((SymbolDictionarySegment) seg).getNoOfExportedSymbols();
			}
		}

		/* number of bits needed to address noOfSymbols distinct symbol ids */
		int symbolCodeLength = 0;
		int count = 1;

		while (count < noOfSymbols) {
			symbolCodeLength++;
			count <<= 1;
		}

		/* concatenate the bitmaps of all dictionaries, in reference order */
		JBIG2Bitmap[] symbols = new JBIG2Bitmap[noOfSymbols];
		int currentSymbol = 0;
		for (Iterator it = symbolDictionaries.iterator(); it.hasNext();) {
			JBIG2Bitmap[] bitmaps = ((SymbolDictionarySegment) it.next()).getBitmaps();
			System.arraycopy(bitmaps, 0, symbols, currentSymbol, bitmaps.length);
			currentSymbol += bitmaps.length;
		}

		int[][] huffmanFSTable = null;
		int[][] huffmanDSTable = null;
		int[][] huffmanDTTable = null;

		int[][] huffmanRDWTable = null;
		int[][] huffmanRDHTable = null;

		int[][] huffmanRDXTable = null;
		int[][] huffmanRDYTable = null;
		int[][] huffmanRSizeTable = null;

		boolean sbHuffman = textRegionFlags.getFlagValue(TextRegionFlags.SB_HUFF) != 0;

		if (sbHuffman) {
			int[][][] tablesFG = { HuffmanDecoder.huffmanTableF, HuffmanDecoder.huffmanTableG };
			int[][][] tablesHIJ = { HuffmanDecoder.huffmanTableH, HuffmanDecoder.huffmanTableI, HuffmanDecoder.huffmanTableJ };
			int[][][] tablesKLM = { HuffmanDecoder.huffmanTableK, HuffmanDecoder.huffmanTableL, HuffmanDecoder.huffmanTableM };
			int[][][] tablesNO = { HuffmanDecoder.huffmanTableN, HuffmanDecoder.huffmanTableO };
			int[][][] tablesA = { HuffmanDecoder.huffmanTableA };

			huffmanFSTable = selectStandardTable(textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_FS), tablesFG);
			huffmanDSTable = selectStandardTable(textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_DS), tablesHIJ);
			huffmanDTTable = selectStandardTable(textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_DT), tablesKLM);
			huffmanRDWTable = selectStandardTable(textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RDW), tablesNO);
			huffmanRDHTable = selectStandardTable(textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RDH), tablesNO);
			huffmanRDXTable = selectStandardTable(textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RDX), tablesNO);
			huffmanRDYTable = selectStandardTable(textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RDY), tablesNO);
			huffmanRSizeTable = selectStandardTable(textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RSIZE), tablesA);
		}

		int[][] symbolCodeTable = null;
		if (sbHuffman) {
			symbolCodeTable = readSymbolCodeTable(noOfSymbols);
		} else {
			arithmeticDecoder.resetIntStats(symbolCodeLength);
			arithmeticDecoder.start();
		}

		boolean symbolRefine = textRegionFlags.getFlagValue(TextRegionFlags.SB_REFINE) != 0;
		int logStrips = textRegionFlags.getFlagValue(TextRegionFlags.LOG_SB_STRIPES);
		int defaultPixel = textRegionFlags.getFlagValue(TextRegionFlags.SB_DEF_PIXEL);
		int combinationOperator = textRegionFlags.getFlagValue(TextRegionFlags.SB_COMB_OP);
		boolean transposed = textRegionFlags.getFlagValue(TextRegionFlags.TRANSPOSED) != 0;
		int referenceCorner = textRegionFlags.getFlagValue(TextRegionFlags.REF_CORNER);
		int sOffset = textRegionFlags.getFlagValue(TextRegionFlags.SB_DS_OFFSET);
		int template = textRegionFlags.getFlagValue(TextRegionFlags.SB_R_TEMPLATE);

		if (symbolRefine) {
			arithmeticDecoder.resetRefinementStats(template, null);
		}

		JBIG2Bitmap bitmap = new JBIG2Bitmap(regionBitmapWidth, regionBitmapHeight, arithmeticDecoder, huffmanDecoder, mmrDecoder);

		bitmap.readTextRegion(sbHuffman, symbolRefine, noOfSymbolInstances, logStrips, noOfSymbols, symbolCodeTable, symbolCodeLength, symbols, defaultPixel, combinationOperator, transposed, referenceCorner, sOffset, huffmanFSTable, huffmanDSTable, huffmanDTTable, huffmanRDWTable, huffmanRDHTable, huffmanRDXTable, huffmanRDYTable, huffmanRSizeTable, template, symbolRegionAdaptiveTemplateX, symbolRegionAdaptiveTemplateY, decoder);

		if (inlineImage) {
			PageInformationSegment pageSegment = decoder.findPageSegement(segmentHeader.getPageAssociation());
			JBIG2Bitmap pageBitmap = pageSegment.getPageBitmap();

			if (JBIG2StreamDecoder.debug) {
				System.out.println(pageBitmap + " " + bitmap);
			}

			int externalCombinationOperator = regionFlags.getFlagValue(RegionFlags.EXTERNAL_COMBINATION_OPERATOR);
			pageBitmap.combine(bitmap, regionBitmapXLocation, regionBitmapYLocation, externalCombinationOperator);
		} else {
			bitmap.setBitmapNumber(getSegmentHeader().getSegmentNumber());
			decoder.appendBitmap(bitmap);
		}

		decoder.consumeRemainingBits();
	}

	/**
	 * Picks the standard Huffman table named by a selector value.
	 *
	 * @param selector flag value read from the Huffman flags
	 * @param standardTables the standard tables, indexed by selector value
	 * @return the selected table, or <code>null</code> when the selector does
	 *         not name a standard table (custom tables are not supported)
	 */
	private static int[][] selectStandardTable(int selector, int[][][] standardTables) {
		if (selector >= 0 && selector < standardTables.length) {
			return standardTables[selector];
		}
		return null;
	}

	/**
	 * Reads the symbol id code lengths from the stream and builds the Huffman
	 * table used to decode symbol ids.
	 *
	 * Table rows hold four ints; column 1 receives the code length and column 2
	 * the end-of-table marker. NOTE(review): the full row layout presumably
	 * matches what HuffmanDecoder.buildTable expects (value, prefix length,
	 * range length, prefix) - confirm against that class.
	 *
	 * @param noOfSymbols number of symbols available to the text region
	 * @return the table produced by the Huffman decoder's buildTable
	 * @throws IOException if the stream fails or the first decoded run asks to
	 *             repeat the code length of a preceding symbol that does not exist
	 * @throws JBIG2Exception propagated from the decoders
	 */
	private int[][] readSymbolCodeTable(int noOfSymbols) throws IOException, JBIG2Exception {
		decoder.consumeRemainingBits();

		/* 35 run-length codes, each with a 4 bit length read from the stream, plus the end marker */
		int[][] runLengthTable = new int[36][];
		for (int code = 0; code < 32; code++) {
			runLengthTable[code] = new int[] { code, decoder.readBits(4), 0, 0 };
		}

		runLengthTable[32] = new int[] { 0x103, decoder.readBits(4), 2, 0 };

		runLengthTable[33] = new int[] { 0x203, decoder.readBits(4), 3, 0 };

		runLengthTable[34] = new int[] { 0x20b, decoder.readBits(4), 7, 0 };

		/* four columns like every other row, so a write to column 3 can never go out of bounds */
		runLengthTable[35] = new int[] { 0, 0, HuffmanDecoder.jbig2HuffmanEOT, 0 };

		runLengthTable = huffmanDecoder.buildTable(runLengthTable, 35);

		/* one row per symbol plus the end marker; the remaining columns start at zero */
		int[][] symbolCodeTable = new int[noOfSymbols + 1][4];
		for (int symbol = 0; symbol < noOfSymbols; symbol++) {
			symbolCodeTable[symbol][0] = symbol;
		}

		int i = 0;
		while (i < noOfSymbols) {
			int code = huffmanDecoder.decodeInt(runLengthTable).intResult();
			if (code > 0x200) {
				/* run of symbols with code length zero */
				for (int run = code - 0x200; run != 0 && i < noOfSymbols; run--) {
					symbolCodeTable[i++][1] = 0;
				}
			} else if (code > 0x100) {
				/* run repeating the previous symbol's code length */
				if (i == 0) {
					// there is no previous symbol; this used to fail with an
					// ArrayIndexOutOfBoundsException on index -1
					throw new IOException("Invalid JBIG2 text region: symbol code lengths start with a repeat-previous run");
				}
				for (int run = code - 0x100; run != 0 && i < noOfSymbols; run--) {
					symbolCodeTable[i][1] = symbolCodeTable[i - 1][1];
					i++;
				}
			} else {
				symbolCodeTable[i++][1] = code;
			}
		}

		symbolCodeTable[noOfSymbols][1] = 0;
		symbolCodeTable[noOfSymbols][2] = HuffmanDecoder.jbig2HuffmanEOT;
		symbolCodeTable = huffmanDecoder.buildTable(symbolCodeTable, noOfSymbols);

		decoder.consumeRemainingBits();

		return symbolCodeTable;
	}

	/**
	 * Reads the two byte text region flags, then - depending on those flags -
	 * the two byte Huffman flags (SB_HUFF set) and the four refinement adaptive
	 * template values (SB_REFINE set and SB_R_TEMPLATE equal to 0).
	 *
	 * @throws IOException if the underlying stream fails
	 */
	private void readTextRegionFlags() throws IOException {
		/** extract text region Segment flags */
		short[] textRegionFlagsField = new short[2];
		decoder.readByte(textRegionFlagsField);

		int flags = BinaryOperation.getInt16(textRegionFlagsField);
		textRegionFlags.setFlags(flags);

		if (JBIG2StreamDecoder.debug) {
			System.out.println("text region Segment flags = " + flags);
		}

		boolean sbHuff = textRegionFlags.getFlagValue(TextRegionFlags.SB_HUFF) != 0;
		if (sbHuff) {
			/** extract text region Segment Huffman flags */
			short[] textRegionHuffmanFlagsField = new short[2];
			decoder.readByte(textRegionHuffmanFlagsField);

			flags = BinaryOperation.getInt16(textRegionHuffmanFlagsField);
			textRegionHuffmanFlags.setFlags(flags);

			if (JBIG2StreamDecoder.debug) {
				System.out.println("text region segment Huffman flags = " + flags);
			}
		}

		boolean sbRefine = textRegionFlags.getFlagValue(TextRegionFlags.SB_REFINE) != 0;
		int sbrTemplate = textRegionFlags.getFlagValue(TextRegionFlags.SB_R_TEMPLATE);
		if (sbRefine && sbrTemplate == 0) {
			/* stream order is X0, Y0, X1, Y1 */
			symbolRegionAdaptiveTemplateX[0] = readATValue();
			symbolRegionAdaptiveTemplateY[0] = readATValue();
			symbolRegionAdaptiveTemplateX[1] = readATValue();
			symbolRegionAdaptiveTemplateY[1] = readATValue();
		}
	}

	/** @return the text region flags of this segment */
	public TextRegionFlags getTextRegionFlags() {
		return textRegionFlags;
	}

	/** @return the Huffman flags of this segment (left at their initial state unless SB_HUFF was set) */
	public TextRegionHuffmanFlags getTextRegionHuffmanFlags() {
		return textRegionHuffmanFlags;
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy