All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.jpedal.jbig2.segment.region.text.TextRegionSegment Maven / Gradle / Ivy

There is a newer version: 7.15.25
Show newest version
/**
 * ===========================================
 * Java Pdf Extraction Decoding Access Library
 * ===========================================
 * 

* Project Info: http://www.jpedal.org * (C) Copyright 1997-2008, IDRsolutions and Contributors. * Main Developer: Simon Barnett *

* This file is part of JPedal *

* Copyright (c) 2008, IDRsolutions * All rights reserved. *

* Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * Neither the name of the IDRsolutions nor the * names of its contributors may be used to endorse or promote products * derived from this software without specific prior written permission. *

* THIS SOFTWARE IS PROVIDED BY IDRsolutions ``AS IS'' AND ANY * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE * DISCLAIMED. IN NO EVENT SHALL IDRsolutions BE LIABLE FOR ANY * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. *

* Other JBIG2 image decoding implementations include * jbig2dec (http://jbig2dec.sourceforge.net/) * xpdf (http://www.foolabs.com/xpdf/) *

* The final draft JBIG2 specification can be found at http://www.jpeg.org/public/fcd14492.pdf *

* All three of the above resources were used in the writing of this software, with methodologies, * processes and inspiration taken from all three. *

* --------------- * TextRegionSegment.java * --------------- */
package org.jpedal.jbig2.segment.region.text;

import java.io.IOException;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;

import org.jpedal.jbig2.JBIG2Exception;
import org.jpedal.jbig2.decoders.HuffmanDecoder;
import org.jpedal.jbig2.decoders.JBIG2StreamDecoder;
import org.jpedal.jbig2.image.JBIG2Bitmap;
import org.jpedal.jbig2.segment.Segment;
import org.jpedal.jbig2.segment.pageinformation.PageInformationSegment;
import org.jpedal.jbig2.segment.region.RegionFlags;
import org.jpedal.jbig2.segment.region.RegionSegment;
import org.jpedal.jbig2.segment.symboldictionary.SymbolDictionarySegment;
import org.jpedal.jbig2.util.BinaryOperation;

/**
 * Reads a JBIG2 text region segment and decodes it into a {@link JBIG2Bitmap}.
 *
 * <p>The segment is read in this order: the generic region header (via the
 * superclass), the text region flags (plus Huffman flags and refinement
 * adaptive-template values when the flags ask for them), the symbol instance
 * count, and finally the symbol ID code table when Huffman coding is selected.
 * The decoded bitmap is either combined into the page bitmap (inline image) or
 * appended to the stream decoder's bitmap list.
 *
 * <p>NOTE(review): only the standard Huffman tables are wired up. When a
 * Huffman flag selects a user-supplied table, the corresponding table is left
 * {@code null} and handed to {@code JBIG2Bitmap.readTextRegion} as such; the
 * referred-to TABLES segments are collected but never consumed.
 */
public class TextRegionSegment extends RegionSegment {

	/** Run codes above this value mean "repeat the previous prefix length". */
	private static final int RUN_REPEAT_PREVIOUS_BASE = 0x100;

	/** Run codes above this value mean "emit a run of zero prefix lengths". */
	private static final int RUN_ZERO_BASE = 0x200;

	/** Number of rows in the run-length table excluding the end-of-table row. */
	private static final int RUN_LENGTH_TABLE_SIZE = 35;

	private final TextRegionFlags textRegionFlags = new TextRegionFlags();

	private final TextRegionHuffmanFlags textRegionHuffmanFlags = new TextRegionHuffmanFlags();

	private int noOfSymbolInstances;

	private final boolean inlineImage;

	private final short[] symbolRegionAdaptiveTemplateX = new short[2];

	private final short[] symbolRegionAdaptiveTemplateY = new short[2];

	/**
	 * @param streamDecoder decoder that supplies the segment data
	 * @param inlineImage   when {@code true} the decoded region is combined into
	 *                      the page bitmap; otherwise it is appended to the
	 *                      decoder as a separate bitmap
	 */
	public TextRegionSegment(JBIG2StreamDecoder streamDecoder, boolean inlineImage) {
		super(streamDecoder);

		this.inlineImage = inlineImage;
	}

	/**
	 * Reads the text region segment from the stream and decodes its bitmap.
	 *
	 * @throws IOException    propagated from the underlying stream reads
	 * @throws JBIG2Exception propagated from the decoders
	 */
	public void readSegment() throws IOException, JBIG2Exception {
		if (JBIG2StreamDecoder.debug) {
			System.out.println("==== Reading Text Region ====");
		}

		super.readSegment();

		// read text region Segment flags
		readTextRegionFlags();

		short[] buff = new short[4];
		decoder.readByte(buff);
		noOfSymbolInstances = BinaryOperation.getInt32(buff);

		if (JBIG2StreamDecoder.debug) {
			System.out.println("noOfSymbolInstances = " + noOfSymbolInstances);
		}

		int noOfReferredToSegments = segmentHeader.getReferredToSegmentCount();
		int[] referredToSegments = segmentHeader.getReferredToSegments();

		// Collected for user-supplied Huffman tables, which are not consumed below.
		List codeTables = new ArrayList();
		List symbolDictionaries = new ArrayList();
		int noOfSymbols = 0;

		if (JBIG2StreamDecoder.debug) {
			System.out.println("noOfReferredToSegments = " + noOfReferredToSegments);
		}

		for (int s = 0; s < noOfReferredToSegments; s++) {
			Segment seg = decoder.findSegment(referredToSegments[s]);
			int type = seg.getSegmentHeader().getSegmentType();

			if (type == Segment.SYMBOL_DICTIONARY) {
				symbolDictionaries.add(seg);
				noOfSymbols += ((SymbolDictionarySegment) seg).getNoOfExportedSymbols();
			} else if (type == Segment.TABLES) {
				codeTables.add(seg);
			}
		}

		// Smallest bit count whose range covers every symbol index.
		int symbolCodeLength = 0;
		for (int capacity = 1; capacity < noOfSymbols; capacity <<= 1) {
			symbolCodeLength++;
		}

		JBIG2Bitmap[] symbols = collectSymbols(symbolDictionaries, noOfSymbols);

		int[][] huffmanFSTable = null;
		int[][] huffmanDSTable = null;
		int[][] huffmanDTTable = null;
		int[][] huffmanRDWTable = null;
		int[][] huffmanRDHTable = null;
		int[][] huffmanRDXTable = null;
		int[][] huffmanRDYTable = null;
		int[][] huffmanRSizeTable = null;

		boolean sbHuffman = textRegionFlags.getFlagValue(TextRegionFlags.SB_HUFF) != 0;

		int[][] symbolCodeTable;

		if (sbHuffman) {
			int[][][] refinementTables = { HuffmanDecoder.huffmanTableN, HuffmanDecoder.huffmanTableO };

			huffmanFSTable = standardTable(
					textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_FS),
					new int[][][] { HuffmanDecoder.huffmanTableF, HuffmanDecoder.huffmanTableG });
			huffmanDSTable = standardTable(
					textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_DS),
					new int[][][] { HuffmanDecoder.huffmanTableH, HuffmanDecoder.huffmanTableI,
							HuffmanDecoder.huffmanTableJ });
			huffmanDTTable = standardTable(
					textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_DT),
					new int[][][] { HuffmanDecoder.huffmanTableK, HuffmanDecoder.huffmanTableL,
							HuffmanDecoder.huffmanTableM });
			huffmanRDWTable = standardTable(
					textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RDW), refinementTables);
			huffmanRDHTable = standardTable(
					textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RDH), refinementTables);
			huffmanRDXTable = standardTable(
					textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RDX), refinementTables);
			huffmanRDYTable = standardTable(
					textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RDY), refinementTables);
			huffmanRSizeTable = standardTable(
					textRegionHuffmanFlags.getFlagValue(TextRegionHuffmanFlags.SB_HUFF_RSIZE),
					new int[][][] { HuffmanDecoder.huffmanTableA });

			symbolCodeTable = readSymbolCodeTable(noOfSymbols);
		} else {
			symbolCodeTable = null;
			arithmeticDecoder.resetIntStats(symbolCodeLength);
			arithmeticDecoder.start();
		}

		boolean symbolRefine = textRegionFlags.getFlagValue(TextRegionFlags.SB_REFINE) != 0;
		int logStrips = textRegionFlags.getFlagValue(TextRegionFlags.LOG_SB_STRIPES);
		int defaultPixel = textRegionFlags.getFlagValue(TextRegionFlags.SB_DEF_PIXEL);
		int combinationOperator = textRegionFlags.getFlagValue(TextRegionFlags.SB_COMB_OP);
		boolean transposed = textRegionFlags.getFlagValue(TextRegionFlags.TRANSPOSED) != 0;
		int referenceCorner = textRegionFlags.getFlagValue(TextRegionFlags.REF_CORNER);
		int sOffset = textRegionFlags.getFlagValue(TextRegionFlags.SB_DS_OFFSET);
		int template = textRegionFlags.getFlagValue(TextRegionFlags.SB_R_TEMPLATE);

		if (symbolRefine) {
			arithmeticDecoder.resetRefinementStats(template, null);
		}

		JBIG2Bitmap bitmap = new JBIG2Bitmap(regionBitmapWidth, regionBitmapHeight, arithmeticDecoder,
				huffmanDecoder, mmrDecoder);

		bitmap.readTextRegion(sbHuffman, symbolRefine, noOfSymbolInstances, logStrips, noOfSymbols,
				symbolCodeTable, symbolCodeLength, symbols, defaultPixel, combinationOperator, transposed,
				referenceCorner, sOffset, huffmanFSTable, huffmanDSTable, huffmanDTTable, huffmanRDWTable,
				huffmanRDHTable, huffmanRDXTable, huffmanRDYTable, huffmanRSizeTable, template,
				symbolRegionAdaptiveTemplateX, symbolRegionAdaptiveTemplateY, decoder);

		if (inlineImage) {
			PageInformationSegment pageSegment = decoder.findPageSegement(segmentHeader.getPageAssociation());
			JBIG2Bitmap pageBitmap = pageSegment.getPageBitmap();

			if (JBIG2StreamDecoder.debug) {
				System.out.println(pageBitmap + " " + bitmap);
			}

			int externalCombinationOperator = regionFlags.getFlagValue(RegionFlags.EXTERNAL_COMBINATION_OPERATOR);
			pageBitmap.combine(bitmap, regionBitmapXLocation, regionBitmapYLocation, externalCombinationOperator);
		} else {
			bitmap.setBitmapNumber(getSegmentHeader().getSegmentNumber());
			decoder.appendBitmap(bitmap);
		}

		decoder.consumeRemainingBits();
	}

	/**
	 * Returns the standard Huffman table chosen by a flag value, or {@code null}
	 * when the value does not index one of the supplied standard tables.
	 */
	private static int[][] standardTable(int selector, int[][][] standardTables) {
		if (selector < 0 || selector >= standardTables.length) {
			return null;
		}
		return standardTables[selector];
	}

	/**
	 * Concatenates the bitmaps of the given symbol dictionary segments, in list
	 * order, into one array of length {@code noOfSymbols}.
	 */
	private static JBIG2Bitmap[] collectSymbols(List symbolDictionaries, int noOfSymbols) {
		JBIG2Bitmap[] symbols = new JBIG2Bitmap[noOfSymbols];
		int next = 0;

		for (Iterator it = symbolDictionaries.iterator(); it.hasNext();) {
			JBIG2Bitmap[] bitmaps = ((SymbolDictionarySegment) it.next()).getBitmaps();
			System.arraycopy(bitmaps, 0, symbols, next, bitmaps.length);
			next += bitmaps.length;
		}

		return symbols;
	}

	/**
	 * Reads the run-length coded prefix lengths of the symbol ID codes from the
	 * stream and builds the symbol ID Huffman table from them.
	 *
	 * <p>Rows are {@code int[4]}; this method fills column 0 with the value
	 * (symbol index or run code) and column 1 with the prefix length, and marks
	 * the final row with {@code HuffmanDecoder.jbig2HuffmanEOT} in column 2.
	 *
	 * @param noOfSymbols number of symbols available to this text region
	 * @return the table returned by {@code huffmanDecoder.buildTable}
	 */
	private int[][] readSymbolCodeTable(int noOfSymbols) throws IOException, JBIG2Exception {
		decoder.consumeRemainingBits();

		int[][] runLengthTable = new int[RUN_LENGTH_TABLE_SIZE + 1][];
		for (int r = 0; r < 32; r++) {
			runLengthTable[r] = new int[] { r, decoder.readBits(4), 0, 0 };
		}
		runLengthTable[32] = new int[] { 0x103, decoder.readBits(4), 2, 0 };
		runLengthTable[33] = new int[] { 0x203, decoder.readBits(4), 3, 0 };
		runLengthTable[34] = new int[] { 0x20b, decoder.readBits(4), 7, 0 };
		// Four columns like every other row, so the terminator can never be
		// indexed out of bounds by code that touches column 3.
		runLengthTable[RUN_LENGTH_TABLE_SIZE] = new int[] { 0, 0, HuffmanDecoder.jbig2HuffmanEOT, 0 };

		runLengthTable = huffmanDecoder.buildTable(runLengthTable, RUN_LENGTH_TABLE_SIZE);

		int[][] symbolCodeTable = new int[noOfSymbols + 1][4];
		for (int s = 0; s < noOfSymbols; s++) {
			symbolCodeTable[s][0] = s;
		}

		int index = 0;
		while (index < noOfSymbols) {
			int code = huffmanDecoder.decodeInt(runLengthTable).intResult();

			if (code > RUN_ZERO_BASE) {
				for (int run = code - RUN_ZERO_BASE; run != 0 && index < noOfSymbols; run--) {
					symbolCodeTable[index++][1] = 0;
				}
			} else if (code > RUN_REPEAT_PREVIOUS_BASE) {
				// A repeat run with nothing before it only occurs in malformed
				// data; use length 0 instead of reading index -1.
				int previousLength = index > 0 ? symbolCodeTable[index - 1][1] : 0;
				for (int run = code - RUN_REPEAT_PREVIOUS_BASE; run != 0 && index < noOfSymbols; run--) {
					symbolCodeTable[index++][1] = previousLength;
				}
			} else {
				symbolCodeTable[index++][1] = code;
			}
		}

		symbolCodeTable[noOfSymbols][1] = 0;
		symbolCodeTable[noOfSymbols][2] = HuffmanDecoder.jbig2HuffmanEOT;
		symbolCodeTable = huffmanDecoder.buildTable(symbolCodeTable, noOfSymbols);

		decoder.consumeRemainingBits();

		return symbolCodeTable;
	}

	/**
	 * Reads the two-byte text region flags, then the two-byte Huffman flags when
	 * {@code SB_HUFF} is set, then the four refinement adaptive-template values
	 * when {@code SB_REFINE} is set and {@code SB_R_TEMPLATE} is 0.
	 */
	private void readTextRegionFlags() throws IOException {
		// extract text region Segment flags
		short[] textRegionFlagsField = new short[2];
		decoder.readByte(textRegionFlagsField);

		int flags = BinaryOperation.getInt16(textRegionFlagsField);
		textRegionFlags.setFlags(flags);

		if (JBIG2StreamDecoder.debug) {
			System.out.println("text region Segment flags = " + flags);
		}

		boolean sbHuff = textRegionFlags.getFlagValue(TextRegionFlags.SB_HUFF) != 0;
		if (sbHuff) {
			// extract text region Segment Huffman flags
			short[] textRegionHuffmanFlagsField = new short[2];
			decoder.readByte(textRegionHuffmanFlagsField);

			flags = BinaryOperation.getInt16(textRegionHuffmanFlagsField);
			textRegionHuffmanFlags.setFlags(flags);

			if (JBIG2StreamDecoder.debug) {
				System.out.println("text region segment Huffman flags = " + flags);
			}
		}

		boolean sbRefine = textRegionFlags.getFlagValue(TextRegionFlags.SB_REFINE) != 0;
		int sbrTemplate = textRegionFlags.getFlagValue(TextRegionFlags.SB_R_TEMPLATE);
		if (sbRefine && sbrTemplate == 0) {
			symbolRegionAdaptiveTemplateX[0] = readATValue();
			symbolRegionAdaptiveTemplateY[0] = readATValue();
			symbolRegionAdaptiveTemplateX[1] = readATValue();
			symbolRegionAdaptiveTemplateY[1] = readATValue();
		}
	}

	/** @return the text region flags populated by {@link #readSegment()} */
	public TextRegionFlags getTextRegionFlags() {
		return textRegionFlags;
	}

	/** @return the Huffman flags; only populated when {@code SB_HUFF} is set */
	public TextRegionHuffmanFlags getTextRegionHuffmanFlags() {
		return textRegionHuffmanFlags;
	}
}





© 2015 - 2025 Weber Informatics LLC | Privacy Policy