com.feilong.lib.compress.archivers.zip.ZipArchiveInputStream Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of feilong Show documentation
feilong is a suite of core and expanded libraries that include utility classes, http, excel,cvs, io classes, and much much more.
There is a newer version: 4.3.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package com.feilong.lib.compress.archivers.zip;

import static com.feilong.lib.compress.archivers.zip.ZipConstants.DWORD;
import static com.feilong.lib.compress.archivers.zip.ZipConstants.SHORT;
import static com.feilong.lib.compress.archivers.zip.ZipConstants.WORD;
import static com.feilong.lib.compress.archivers.zip.ZipConstants.ZIP64_MAGIC;

import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.EOFException;
import java.io.IOException;
import java.io.InputStream;
import java.io.PushbackInputStream;
import java.math.BigInteger;
import java.nio.ByteBuffer;
import java.util.Arrays;
import java.util.zip.CRC32;
import java.util.zip.DataFormatException;
import java.util.zip.Inflater;
import java.util.zip.ZipEntry;
import java.util.zip.ZipException;

import com.feilong.lib.compress.archivers.ArchiveEntry;
import com.feilong.lib.compress.archivers.ArchiveInputStream;
import com.feilong.lib.compress.utils.ArchiveUtils;
import com.feilong.lib.compress.utils.IOUtils;
import com.feilong.lib.compress.utils.InputStreamStatistics;

/**
 * Implements an input stream that can read Zip archives.
 *
 * 
 * As of Apache Commons Compress it transparently supports Zip64
 * extensions and thus individual entries and archives larger than 4
 * GB or with more than 65536 entries.
 * 
 *
 * 
 * The {@link ZipFile} class is preferred when reading from files
 * as {@link ZipArchiveInputStream} is limited by not being able to
 * read the central directory header before returning entries. In
 * particular {@link ZipArchiveInputStream}
 * 
 *
 * 
 *
 * may return entries that are not part of the central directory
 * at all and shouldn't be considered part of the archive.
 *
 * may return several entries with the same name.
 *
 * will not return internal or external attributes.
 *
 * may return incomplete extra field data.
 *
 * may return unknown sizes and CRC values for entries until the
 * next entry has been reached if the archive uses the data
 * descriptor feature.
 *
 * 
 *
 * @see ZipFile
 * @NotThreadSafe
 */
public class ZipArchiveInputStream extends ArchiveInputStream implements InputStreamStatistics{

    /** The zip encoding to use for file names and the file comment. */
    private final ZipEncoding    zipEncoding;

    // the provided encoding (for unit tests)
    final String                 encoding;

    /** Whether to look for and use Unicode extra fields. */
    private final boolean        useUnicodeExtraFields;

    /** Wrapped stream, will always be a PushbackInputStream. */
    private final InputStream    in;

    /** Inflater used for all deflated entries. */
    private final Inflater       inf                                  = new Inflater(true);

    /** Buffer used to read from the wrapped stream. */
    private final ByteBuffer     buf                                  = ByteBuffer.allocate(ZipArchiveOutputStream.BUFFER_SIZE);

    /** The entry that is currently being read. */
    private CurrentEntry         current                              = null;

    /** Whether the stream has been closed. */
    private boolean              closed                               = false;

    /** Whether the stream has reached the central directory - and thus found all entries. */
    private boolean              hitCentralDirectory                  = false;

    /**
     * When reading a stored entry that uses the data descriptor this
     * stream has to read the full entry and caches it. This is the
     * cache.
     */
    private ByteArrayInputStream lastStoredEntry                      = null;

    /** Whether the stream will try to read STORED entries that use a data descriptor. */
    private boolean              allowStoredEntriesWithDataDescriptor = false;

    /** Count decompressed bytes for current entry */
    private long                 uncompressedCount                    = 0;

    /** Whether the stream will try to skip the zip split signature(08074B50) at the beginning **/
    private final boolean        skipSplitSig;

    private static final int     LFH_LEN                              = 30;
    /*
     * local file header signature WORD
     * version needed to extract SHORT
     * general purpose bit flag SHORT
     * compression method SHORT
     * last mod file time SHORT
     * last mod file date SHORT
     * crc-32 WORD
     * compressed size WORD
     * uncompressed size WORD
     * file name length SHORT
     * extra field length SHORT
     */

    private static final int     CFH_LEN                              = 46;
    /*
     * central file header signature WORD
     * version made by SHORT
     * version needed to extract SHORT
     * general purpose bit flag SHORT
     * compression method SHORT
     * last mod file time SHORT
     * last mod file date SHORT
     * crc-32 WORD
     * compressed size WORD
     * uncompressed size WORD
     * file name length SHORT
     * extra field length SHORT
     * file comment length SHORT
     * disk number start SHORT
     * internal file attributes SHORT
     * external file attributes WORD
     * relative offset of local header WORD
     */

    private static final long    TWO_EXP_32                           = ZIP64_MAGIC + 1;

    // cached buffers - must only be used locally in the class (COMPRESS-172 - reduce garbage collection)
    private final byte[]         lfhBuf                               = new byte[LFH_LEN];

    private final byte[]         skipBuf                              = new byte[1024];

    private final byte[]         shortBuf                             = new byte[SHORT];

    private final byte[]         wordBuf                              = new byte[WORD];

    private final byte[]         twoDwordBuf                          = new byte[2 * DWORD];

    private int                  entriesRead                          = 0;

    /**
     * Create an instance using UTF-8 encoding
     * 
     * @param inputStream
     *            the stream to wrap
     */
    public ZipArchiveInputStream(final InputStream inputStream){
        this(inputStream, ZipEncodingHelper.UTF8);
    }

    /**
     * Create an instance using the specified encoding
     * 
     * @param inputStream
     *            the stream to wrap
     * @param encoding
     *            the encoding to use for file names, use null
     *            for the platform's default encoding
     * @since 1.5
     */
    public ZipArchiveInputStream(final InputStream inputStream, final String encoding){
        this(inputStream, encoding, true);
    }

    /**
     * Create an instance using the specified encoding
     * 
     * @param inputStream
     *            the stream to wrap
     * @param encoding
     *            the encoding to use for file names, use null
     *            for the platform's default encoding
     * @param useUnicodeExtraFields
     *            whether to use InfoZIP Unicode
     *            Extra Fields (if present) to set the file names.
     */
    public ZipArchiveInputStream(final InputStream inputStream, final String encoding, final boolean useUnicodeExtraFields){
        this(inputStream, encoding, useUnicodeExtraFields, false);
    }

    /**
     * Create an instance using the specified encoding
     * 
     * @param inputStream
     *            the stream to wrap
     * @param encoding
     *            the encoding to use for file names, use null
     *            for the platform's default encoding
     * @param useUnicodeExtraFields
     *            whether to use InfoZIP Unicode
     *            Extra Fields (if present) to set the file names.
     * @param allowStoredEntriesWithDataDescriptor
     *            whether the stream
     *            will try to read STORED entries that use a data descriptor
     * @since 1.1
     */
    public ZipArchiveInputStream(final InputStream inputStream, final String encoding, final boolean useUnicodeExtraFields,
                    final boolean allowStoredEntriesWithDataDescriptor){
        this(inputStream, encoding, useUnicodeExtraFields, allowStoredEntriesWithDataDescriptor, false);
    }

    /**
     * Create an instance using the specified encoding
     * 
     * @param inputStream
     *            the stream to wrap
     * @param encoding
     *            the encoding to use for file names, use null
     *            for the platform's default encoding
     * @param useUnicodeExtraFields
     *            whether to use InfoZIP Unicode
     *            Extra Fields (if present) to set the file names.
     * @param allowStoredEntriesWithDataDescriptor
     *            whether the stream
     *            will try to read STORED entries that use a data descriptor
     * @param skipSplitSig
     *            Whether the stream will try to skip the zip
     *            split signature(08074B50) at the beginning. You will need to
     *            set this to true if you want to read a split archive.
     * @since 1.20
     */
    public ZipArchiveInputStream(final InputStream inputStream, final String encoding, final boolean useUnicodeExtraFields,
                    final boolean allowStoredEntriesWithDataDescriptor, final boolean skipSplitSig){
        this.encoding = encoding;
        zipEncoding = ZipEncodingHelper.getZipEncoding(encoding);
        this.useUnicodeExtraFields = useUnicodeExtraFields;
        in = new PushbackInputStream(inputStream, buf.capacity());
        this.allowStoredEntriesWithDataDescriptor = allowStoredEntriesWithDataDescriptor;
        this.skipSplitSig = skipSplitSig;
        // haven't read anything so far
        buf.limit(0);
    }

    public ZipArchiveEntry getNextZipEntry() throws IOException{
        uncompressedCount = 0;

        boolean firstEntry = true;
        if (closed || hitCentralDirectory){
            return null;
        }
        if (current != null){
            closeEntry();
            firstEntry = false;
        }

        long currentHeaderOffset = getBytesRead();
        try{
            if (firstEntry){
                // split archives have a special signature before the
                // first local file header - look for it and fail with
                // the appropriate error message if this is a split
                // archive.
                readFirstLocalFileHeader(lfhBuf);
            }else{
                readFully(lfhBuf);
            }
        }catch (final EOFException e){ //NOSONAR
            return null;
        }

        final ZipLong sig = new ZipLong(lfhBuf);
        if (!sig.equals(ZipLong.LFH_SIG)){
            if (sig.equals(ZipLong.CFH_SIG) || sig.equals(ZipLong.AED_SIG) || isApkSigningBlock(lfhBuf)){
                hitCentralDirectory = true;
                skipRemainderOfArchive();
                return null;
            }
            throw new ZipException(String.format("Unexpected record signature: 0X%X", sig.getValue()));
        }

        int off = WORD;
        current = new CurrentEntry();

        final int versionMadeBy = ZipShort.getValue(lfhBuf, off);
        off += SHORT;
        current.entry.setPlatform((versionMadeBy >> ZipFile.BYTE_SHIFT) & ZipFile.NIBLET_MASK);

        final GeneralPurposeBit gpFlag = GeneralPurposeBit.parse(lfhBuf, off);
        final boolean hasUTF8Flag = gpFlag.usesUTF8ForNames();
        final ZipEncoding entryEncoding = hasUTF8Flag ? ZipEncodingHelper.UTF8_ZIP_ENCODING : zipEncoding;
        current.hasDataDescriptor = gpFlag.usesDataDescriptor();
        current.entry.setGeneralPurposeBit(gpFlag);

        off += SHORT;

        current.entry.setMethod(ZipShort.getValue(lfhBuf, off));
        off += SHORT;

        final long time = ZipUtil.dosToJavaTime(ZipLong.getValue(lfhBuf, off));
        current.entry.setTime(time);
        off += WORD;

        ZipLong size = null, cSize = null;
        if (!current.hasDataDescriptor){
            current.entry.setCrc(ZipLong.getValue(lfhBuf, off));
            off += WORD;

            cSize = new ZipLong(lfhBuf, off);
            off += WORD;

            size = new ZipLong(lfhBuf, off);
            off += WORD;
        }else{
            off += 3 * WORD;
        }

        final int fileNameLen = ZipShort.getValue(lfhBuf, off);

        off += SHORT;

        final int extraLen = ZipShort.getValue(lfhBuf, off);
        off += SHORT; // NOSONAR - assignment as documentation

        final byte[] fileName = new byte[fileNameLen];
        readFully(fileName);
        current.entry.setName(entryEncoding.decode(fileName), fileName);
        if (hasUTF8Flag){
            current.entry.setNameSource(ZipArchiveEntry.NameSource.NAME_WITH_EFS_FLAG);
        }

        final byte[] extraData = new byte[extraLen];
        readFully(extraData);
        current.entry.setExtra(extraData);

        if (!hasUTF8Flag && useUnicodeExtraFields){
            ZipUtil.setNameAndCommentFromExtraFields(current.entry, fileName, null);
        }

        processZip64Extra(size, cSize);

        current.entry.setLocalHeaderOffset(currentHeaderOffset);
        current.entry.setDataOffset(getBytesRead());
        current.entry.setStreamContiguous(true);

        ZipMethod m = ZipMethod.getMethodByCode(current.entry.getMethod());
        if (current.entry.getCompressedSize() != ArchiveEntry.SIZE_UNKNOWN){
            if (ZipUtil.canHandleEntryData(current.entry) && m != ZipMethod.STORED && m != ZipMethod.DEFLATED){
                InputStream bis = new BoundedInputStream(in, current.entry.getCompressedSize());
                switch (m) {
                    //                case UNSHRINKING:
                    //                    current.in = new UnshrinkingInputStream(bis);
                    //                    break;
                    case IMPLODING:
                        current.in = new ExplodingInputStream(
                                        current.entry.getGeneralPurposeBit().getSlidingDictionarySize(),
                                        current.entry.getGeneralPurposeBit().getNumberOfShannonFanoTrees(),
                                        bis);
                        break;
                    //                case BZIP2:
                    //                    current.in = new BZip2CompressorInputStream(bis);
                    //                    break;
                    //                case ENHANCED_DEFLATED:
                    //                    current.in = new Deflate64CompressorInputStream(bis);
                    //                    break;
                    default:
                        // we should never get here as all supported methods have been covered
                        // will cause an error when read is invoked, don't throw an exception here so people can
                        // skip unsupported entries
                        break;
                }
            }
        }

        //        else if (m == ZipMethod.ENHANCED_DEFLATED) {
        //            current.in = new Deflate64CompressorInputStream(in);
        //        }

        entriesRead++;
        return current.entry;
    }

    /**
     * Fills the given array with the first local file header and
     * deals with splitting/spanning markers that may prefix the first
     * LFH.
     */
    private void readFirstLocalFileHeader(final byte[] lfh) throws IOException{
        readFully(lfh);
        final ZipLong sig = new ZipLong(lfh);

        if (!skipSplitSig && sig.equals(ZipLong.DD_SIG)){
            throw new UnsupportedZipFeatureException(UnsupportedZipFeatureException.Feature.SPLITTING);
        }

        // the split zip signature(08074B50) should only be skipped when the skipSplitSig is set
        if (sig.equals(ZipLong.SINGLE_SEGMENT_SPLIT_MARKER) || sig.equals(ZipLong.DD_SIG)){
            // Just skip over the marker.
            final byte[] missedLfhBytes = new byte[4];
            readFully(missedLfhBytes);
            System.arraycopy(lfh, 4, lfh, 0, LFH_LEN - 4);
            System.arraycopy(missedLfhBytes, 0, lfh, LFH_LEN - 4, 4);
        }
    }

    /**
     * Records whether a Zip64 extra is present and sets the size
     * information from it if sizes are 0xFFFFFFFF and the entry
     * doesn't use a data descriptor.
     */
    private void processZip64Extra(final ZipLong size,final ZipLong cSize){
        final Zip64ExtendedInformationExtraField z64 = (Zip64ExtendedInformationExtraField) current.entry
                        .getExtraField(Zip64ExtendedInformationExtraField.HEADER_ID);
        current.usesZip64 = z64 != null;
        if (!current.hasDataDescriptor){
            if (z64 != null // same as current.usesZip64 but avoids NPE warning
                            && (ZipLong.ZIP64_MAGIC.equals(cSize) || ZipLong.ZIP64_MAGIC.equals(size))){
                current.entry.setCompressedSize(z64.getCompressedSize().getLongValue());
                current.entry.setSize(z64.getSize().getLongValue());
            }else if (cSize != null && size != null){
                current.entry.setCompressedSize(cSize.getValue());
                current.entry.setSize(size.getValue());
            }
        }
    }

    @Override
    public ArchiveEntry getNextEntry() throws IOException{
        return getNextZipEntry();
    }

    /**
     * Whether this class is able to read the given entry.
     *
     * 
     * May return false if it is set up to use encryption or a
     * compression method that hasn't been implemented yet.
     * 
     * 
     * @since 1.1
     */
    @Override
    public boolean canReadEntryData(final ArchiveEntry ae){
        if (ae instanceof ZipArchiveEntry){
            final ZipArchiveEntry ze = (ZipArchiveEntry) ae;
            return ZipUtil.canHandleEntryData(ze) && supportsDataDescriptorFor(ze) && supportsCompressedSizeFor(ze);
        }
        return false;
    }

    @Override
    public int read(final byte[] buffer,final int offset,final int length) throws IOException{
        if (length == 0){
            return 0;
        }
        if (closed){
            throw new IOException("The stream is closed");
        }

        if (current == null){
            return -1;
        }

        // avoid int overflow, check null buffer
        if (offset > buffer.length || length < 0 || offset < 0 || buffer.length - offset < length){
            throw new ArrayIndexOutOfBoundsException();
        }

        ZipUtil.checkRequestedFeatures(current.entry);
        if (!supportsDataDescriptorFor(current.entry)){
            throw new UnsupportedZipFeatureException(UnsupportedZipFeatureException.Feature.DATA_DESCRIPTOR, current.entry);
        }
        if (!supportsCompressedSizeFor(current.entry)){
            throw new UnsupportedZipFeatureException(UnsupportedZipFeatureException.Feature.UNKNOWN_COMPRESSED_SIZE, current.entry);
        }

        int read;
        if (current.entry.getMethod() == ZipArchiveOutputStream.STORED){
            read = readStored(buffer, offset, length);
        }else if (current.entry.getMethod() == ZipArchiveOutputStream.DEFLATED){
            read = readDeflated(buffer, offset, length);
        }else if (current.entry.getMethod() == ZipMethod.UNSHRINKING.getCode() || current.entry.getMethod() == ZipMethod.IMPLODING.getCode()
                        || current.entry.getMethod() == ZipMethod.ENHANCED_DEFLATED.getCode()
                        || current.entry.getMethod() == ZipMethod.BZIP2.getCode()){
            read = current.in.read(buffer, offset, length);
        }else{
            throw new UnsupportedZipFeatureException(ZipMethod.getMethodByCode(current.entry.getMethod()), current.entry);
        }

        if (read >= 0){
            current.crc.update(buffer, offset, read);
            uncompressedCount += read;
        }

        return read;
    }

    /**
     * @since 1.17
     */
    @Override
    public long getCompressedCount(){
        if (current.entry.getMethod() == ZipArchiveOutputStream.STORED){
            return current.bytesRead;
        }else if (current.entry.getMethod() == ZipArchiveOutputStream.DEFLATED){
            return getBytesInflated();
        }

        //        else if (current.entry.getMethod() == ZipMethod.UNSHRINKING.getCode()) {
        //            return ((UnshrinkingInputStream) current.in).getCompressedCount();
        //        } else if (current.entry.getMethod() == ZipMethod.IMPLODING.getCode()) {
        //            return ((ExplodingInputStream) current.in).getCompressedCount();
        //        } else if (current.entry.getMethod() == ZipMethod.ENHANCED_DEFLATED.getCode()) {
        //            return ((Deflate64CompressorInputStream) current.in).getCompressedCount();
        //        } else if (current.entry.getMethod() == ZipMethod.BZIP2.getCode()) {
        //            return ((BZip2CompressorInputStream) current.in).getCompressedCount();
        //        } 

        else{
            return -1;
        }
    }

    /**
     * @since 1.17
     */
    @Override
    public long getUncompressedCount(){
        return uncompressedCount;
    }

    /**
     * Implementation of read for STORED entries.
     */
    private int readStored(final byte[] buffer,final int offset,final int length) throws IOException{

        if (current.hasDataDescriptor){
            if (lastStoredEntry == null){
                readStoredEntry();
            }
            return lastStoredEntry.read(buffer, offset, length);
        }

        final long csize = current.entry.getSize();
        if (current.bytesRead >= csize){
            return -1;
        }

        if (buf.position() >= buf.limit()){
            buf.position(0);
            final int l = in.read(buf.array());
            if (l == -1){
                buf.limit(0);
                throw new IOException("Truncated ZIP file");
            }
            buf.limit(l);

            count(l);
            current.bytesReadFromStream += l;
        }

        int toRead = Math.min(buf.remaining(), length);
        if ((csize - current.bytesRead) < toRead){
            // if it is smaller than toRead then it fits into an int
            toRead = (int) (csize - current.bytesRead);
        }
        buf.get(buffer, offset, toRead);
        current.bytesRead += toRead;
        return toRead;
    }

    /**
     * Implementation of read for DEFLATED entries.
     */
    private int readDeflated(final byte[] buffer,final int offset,final int length) throws IOException{
        final int read = readFromInflater(buffer, offset, length);
        if (read <= 0){
            if (inf.finished()){
                return -1;
            }else if (inf.needsDictionary()){
                throw new ZipException("This archive needs a preset dictionary" + " which is not supported by Commons" + " Compress.");
            }else if (read == -1){
                throw new IOException("Truncated ZIP file");
            }
        }
        return read;
    }

    /**
     * Potentially reads more bytes to fill the inflater's buffer and
     * reads from it.
     */
    private int readFromInflater(final byte[] buffer,final int offset,final int length) throws IOException{
        int read = 0;
        do{
            if (inf.needsInput()){
                final int l = fill();
                if (l > 0){
                    current.bytesReadFromStream += buf.limit();
                }else if (l == -1){
                    return -1;
                }else{
                    break;
                }
            }
            try{
                read = inf.inflate(buffer, offset, length);
            }catch (final DataFormatException e){
                throw (IOException) new ZipException(e.getMessage()).initCause(e);
            }
        }while (read == 0 && inf.needsInput());
        return read;
    }

    @Override
    public void close() throws IOException{
        if (!closed){
            closed = true;
            try{
                in.close();
            }finally{
                inf.end();
            }
        }
    }

    /**
     * Skips over and discards value bytes of data from this input
     * stream.
     *
     * 
     * This implementation may end up skipping over some smaller
     * number of bytes, possibly 0, if and only if it reaches the end
     * of the underlying stream.
     * 
     *
     * 
     * The actual number of bytes skipped is returned.
     * 
     *
     * @param value
     *            the number of bytes to be skipped.
     * @return the actual number of bytes skipped.
     * @throws IOException
     *             - if an I/O error occurs.
     * @throws IllegalArgumentException
     *             - if value is negative.
     */
    @Override
    public long skip(final long value) throws IOException{
        if (value >= 0){
            long skipped = 0;
            while (skipped < value){
                final long rem = value - skipped;
                final int x = read(skipBuf, 0, (int) (skipBuf.length > rem ? rem : skipBuf.length));
                if (x == -1){
                    return skipped;
                }
                skipped += x;
            }
            return skipped;
        }
        throw new IllegalArgumentException();
    }

    /**
     * Checks if the signature matches what is expected for a zip file.
     * Does not currently handle self-extracting zips which may have arbitrary
     * leading content.
     *
     * @param signature
     *            the bytes to check
     * @param length
     *            the number of bytes to check
     * @return true, if this stream is a zip archive stream, false otherwise
     */
    public static boolean matches(final byte[] signature,final int length){
        if (length < ZipArchiveOutputStream.LFH_SIG.length){
            return false;
        }

        return checksig(signature, ZipArchiveOutputStream.LFH_SIG) // normal file
                        || checksig(signature, ZipArchiveOutputStream.EOCD_SIG) // empty zip
                        || checksig(signature, ZipArchiveOutputStream.DD_SIG) // split zip
                        || checksig(signature, ZipLong.SINGLE_SEGMENT_SPLIT_MARKER.getBytes());
    }

    private static boolean checksig(final byte[] signature,final byte[] expected){
        for (int i = 0; i < expected.length; i++){
            if (signature[i] != expected[i]){
                return false;
            }
        }
        return true;
    }

    /**
     * Closes the current ZIP archive entry and positions the underlying
     * stream to the beginning of the next entry. All per-entry variables
     * and data structures are cleared.
     * 
     * If the compressed size of this entry is included in the entry header,
     * then any outstanding bytes are simply skipped from the underlying
     * stream without uncompressing them. This allows an entry to be safely
     * closed even if the compression method is unsupported.
     * 

     * In case we don't know the compressed size of this entry or have
     * already buffered too much data from the underlying stream to support
     * uncompression, then the uncompression process is completed and the
     * end position of the stream is adjusted based on the result of that
     * process.
     *
     * @throws IOException
     *             if an error occurs
     */
    private void closeEntry() throws IOException{
        if (closed){
            throw new IOException("The stream is closed");
        }
        if (current == null){
            return;
        }

        // Ensure all entry bytes are read
        if (currentEntryHasOutstandingBytes()){
            drainCurrentEntryData();
        }else{
            // this is guaranteed to exhaust the stream
            skip(Long.MAX_VALUE); //NOSONAR

            final long inB = current.entry.getMethod() == ZipArchiveOutputStream.DEFLATED ? getBytesInflated() : current.bytesRead;

            // this is at most a single read() operation and can't
            // exceed the range of int
            final int diff = (int) (current.bytesReadFromStream - inB);

            // Pushback any required bytes
            if (diff > 0){
                pushback(buf.array(), buf.limit() - diff, diff);
                current.bytesReadFromStream -= diff;
            }

            // Drain remainder of entry if not all data bytes were required
            if (currentEntryHasOutstandingBytes()){
                drainCurrentEntryData();
            }
        }

        if (lastStoredEntry == null && current.hasDataDescriptor){
            readDataDescriptor();
        }

        inf.reset();
        buf.clear().flip();
        current = null;
        lastStoredEntry = null;
    }

    /**
     * If the compressed size of the current entry is included in the entry header
     * and there are any outstanding bytes in the underlying stream, then
     * this returns true.
     *
     * @return true, if current entry is determined to have outstanding bytes, false otherwise
     */
    private boolean currentEntryHasOutstandingBytes(){
        return current.bytesReadFromStream <= current.entry.getCompressedSize() && !current.hasDataDescriptor;
    }

    /**
     * Read all data of the current entry from the underlying stream
     * that hasn't been read, yet.
     */
    private void drainCurrentEntryData() throws IOException{
        long remaining = current.entry.getCompressedSize() - current.bytesReadFromStream;
        while (remaining > 0){
            final long n = in.read(buf.array(), 0, (int) Math.min(buf.capacity(), remaining));
            if (n < 0){
                throw new EOFException("Truncated ZIP entry: " + ArchiveUtils.sanitize(current.entry.getName()));
            }
            count(n);
            remaining -= n;
        }
    }

    /**
     * Get the number of bytes Inflater has actually processed.
     *
     * 

     * for Java < Java7 the getBytes* methods in
     * Inflater/Deflater seem to return unsigned ints rather than
     * longs that start over with 0 at 2^32.
     * 
     *
     * 
     * The stream knows how many bytes it has read, but not how
     * many the Inflater actually consumed - it should be between the
     * total number of bytes read for the entry and the total number
     * minus the last read operation. Here we just try to make the
     * value close enough to the bytes we've read by assuming the
     * number of bytes consumed must be smaller than (or equal to) the
     * number of bytes read but not smaller by more than 2^32.
     * 
     */
    private long getBytesInflated(){
        long inB = inf.getBytesRead();
        if (current.bytesReadFromStream >= TWO_EXP_32){
            while (inB + TWO_EXP_32 <= current.bytesReadFromStream){
                inB += TWO_EXP_32;
            }
        }
        return inB;
    }

    private int fill() throws IOException{
        if (closed){
            throw new IOException("The stream is closed");
        }
        final int length = in.read(buf.array());
        if (length > 0){
            buf.limit(length);
            count(buf.limit());
            inf.setInput(buf.array(), 0, buf.limit());
        }
        return length;
    }

    private void readFully(final byte[] b) throws IOException{
        readFully(b, 0);
    }

    private void readFully(final byte[] b,final int off) throws IOException{
        final int len = b.length - off;
        final int count = IOUtils.readFully(in, b, off, len);
        count(count);
        if (count < len){
            throw new EOFException();
        }
    }

    private void readDataDescriptor() throws IOException{
        readFully(wordBuf);
        ZipLong val = new ZipLong(wordBuf);
        if (ZipLong.DD_SIG.equals(val)){
            // data descriptor with signature, skip sig
            readFully(wordBuf);
            val = new ZipLong(wordBuf);
        }
        current.entry.setCrc(val.getValue());

        // if there is a ZIP64 extra field, sizes are eight bytes
        // each, otherwise four bytes each.  Unfortunately some
        // implementations - namely Java7 - use eight bytes without
        // using a ZIP64 extra field -
        // https://bugs.sun.com/bugdatabase/view_bug.do?bug_id=7073588

        // just read 16 bytes and check whether bytes nine to twelve
        // look like one of the signatures of what could follow a data
        // descriptor (ignoring archive decryption headers for now).
        // If so, push back eight bytes and assume sizes are four
        // bytes, otherwise sizes are eight bytes each.
        readFully(twoDwordBuf);
        final ZipLong potentialSig = new ZipLong(twoDwordBuf, DWORD);
        if (potentialSig.equals(ZipLong.CFH_SIG) || potentialSig.equals(ZipLong.LFH_SIG)){
            pushback(twoDwordBuf, DWORD, DWORD);
            current.entry.setCompressedSize(ZipLong.getValue(twoDwordBuf));
            current.entry.setSize(ZipLong.getValue(twoDwordBuf, WORD));
        }else{
            current.entry.setCompressedSize(ZipEightByteInteger.getLongValue(twoDwordBuf));
            current.entry.setSize(ZipEightByteInteger.getLongValue(twoDwordBuf, DWORD));
        }
    }

    /**
     * Whether this entry requires a data descriptor this library can work with.
     *
     * @return true if allowStoredEntriesWithDataDescriptor is true,
     *         the entry doesn't require any data descriptor or the method is
     *         DEFLATED or ENHANCED_DEFLATED.
     */
    private boolean supportsDataDescriptorFor(final ZipArchiveEntry entry){
        return !entry.getGeneralPurposeBit().usesDataDescriptor()

                        || (allowStoredEntriesWithDataDescriptor && entry.getMethod() == ZipEntry.STORED)
                        || entry.getMethod() == ZipEntry.DEFLATED || entry.getMethod() == ZipMethod.ENHANCED_DEFLATED.getCode();
    }

    /**
     * Whether the compressed size for the entry is either known or
     * not required by the compression method being used.
     */
    private boolean supportsCompressedSizeFor(final ZipArchiveEntry entry){
        return entry.getCompressedSize() != ArchiveEntry.SIZE_UNKNOWN || entry.getMethod() == ZipEntry.DEFLATED
                        || entry.getMethod() == ZipMethod.ENHANCED_DEFLATED.getCode() || (entry.getGeneralPurposeBit().usesDataDescriptor()
                                        && allowStoredEntriesWithDataDescriptor && entry.getMethod() == ZipEntry.STORED);
    }

    private static final String USE_ZIPFILE_INSTEAD_OF_STREAM_DISCLAIMER = " while reading a stored entry using data descriptor. Either the archive is broken"
                    + " or it can not be read using ZipArchiveInputStream and you must use ZipFile."
                    + " A common cause for this is a ZIP archive containing a ZIP archive."
                    + " See http://commons.apache.org/proper/commons-compress/zip.html#ZipArchiveInputStream_vs_ZipFile";

    /**
     * Caches a stored entry that uses the data descriptor.
     *
     * 
     * Reads a stored entry until the signature of a local file
     * header, central directory header or data descriptor has been
     * found.
     * Stores all entry data in lastStoredEntry.
     * 
     * 
Rewinds the stream to position at the data
     * descriptor.
     * reads the data descriptor
     * 
     *
     * 
     * After calling this method the entry should know its size,
     * the entry's data is cached and the stream is positioned at the
     * next local file or central directory header.
     * 
     */
    private void readStoredEntry() throws IOException{
        final ByteArrayOutputStream bos = new ByteArrayOutputStream();
        int off = 0;
        boolean done = false;

        // length of DD without signature
        final int ddLen = current.usesZip64 ? WORD + 2 * DWORD : 3 * WORD;

        while (!done){
            final int r = in.read(buf.array(), off, ZipArchiveOutputStream.BUFFER_SIZE - off);
            if (r <= 0){
                // read the whole archive without ever finding a
                // central directory
                throw new IOException("Truncated ZIP file");
            }
            if (r + off < 4){
                // buffer too small to check for a signature, loop
                off += r;
                continue;
            }

            done = bufferContainsSignature(bos, off, r, ddLen);
            if (!done){
                off = cacheBytesRead(bos, off, r, ddLen);
            }
        }
        if (current.entry.getCompressedSize() != current.entry.getSize()){
            throw new ZipException("compressed and uncompressed size don't match" + USE_ZIPFILE_INSTEAD_OF_STREAM_DISCLAIMER);
        }
        final byte[] b = bos.toByteArray();
        if (b.length != current.entry.getSize()){
            throw new ZipException("actual and claimed size don't match" + USE_ZIPFILE_INSTEAD_OF_STREAM_DISCLAIMER);
        }
        lastStoredEntry = new ByteArrayInputStream(b);
    }

    private static final byte[] LFH = ZipLong.LFH_SIG.getBytes();

    private static final byte[] CFH = ZipLong.CFH_SIG.getBytes();

    private static final byte[] DD  = ZipLong.DD_SIG.getBytes();

    /**
     * Checks whether the current buffer contains the signature of a
     * "data descriptor", "local file header" or
     * "central directory entry".
     *
     * 
     * If it contains such a signature, reads the data descriptor
     * and positions the stream right after the data descriptor.
     * 
     */
    private boolean bufferContainsSignature(final ByteArrayOutputStream bos,final int offset,final int lastRead,final int expectedDDLen)
                    throws IOException{

        boolean done = false;
        for (int i = 0; !done && i < offset + lastRead - 4; i++){
            if (buf.array()[i] == LFH[0] && buf.array()[i + 1] == LFH[1]){
                int expectDDPos = i;
                if (i >= expectedDDLen && (buf.array()[i + 2] == LFH[2] && buf.array()[i + 3] == LFH[3])
                                || (buf.array()[i] == CFH[2] && buf.array()[i + 3] == CFH[3])){
                    // found a LFH or CFH:
                    expectDDPos = i - expectedDDLen;
                    done = true;
                }else if (buf.array()[i + 2] == DD[2] && buf.array()[i + 3] == DD[3]){
                    // found DD:
                    done = true;
                }
                if (done){
                    // * push back bytes read in excess as well as the data
                    //   descriptor
                    // * copy the remaining bytes to cache
                    // * read data descriptor
                    pushback(buf.array(), expectDDPos, offset + lastRead - expectDDPos);
                    bos.write(buf.array(), 0, expectDDPos);
                    readDataDescriptor();
                }
            }
        }
        return done;
    }

    /**
     * If the last read bytes could hold a data descriptor and an
     * incomplete signature then save the last bytes to the front of
     * the buffer and cache everything in front of the potential data
     * descriptor into the given ByteArrayOutputStream.
     *
     * 
     * Data descriptor plus incomplete signature (3 bytes in the
     * worst case) can be 20 bytes max.
     * 
     */
    private int cacheBytesRead(final ByteArrayOutputStream bos,int offset,final int lastRead,final int expecteDDLen){
        final int cacheable = offset + lastRead - expecteDDLen - 3;
        if (cacheable > 0){
            bos.write(buf.array(), 0, cacheable);
            System.arraycopy(buf.array(), cacheable, buf.array(), 0, expecteDDLen + 3);
            offset = expecteDDLen + 3;
        }else{
            offset += lastRead;
        }
        return offset;
    }

    private void pushback(final byte[] buf,final int offset,final int length) throws IOException{
        ((PushbackInputStream) in).unread(buf, offset, length);
        pushedBackBytes(length);
    }

    // End of Central Directory Record
    //   end of central dir signature    WORD
    //   number of this disk             SHORT
    //   number of the disk with the
    //   start of the central directory  SHORT
    //   total number of entries in the
    //   central directory on this disk  SHORT
    //   total number of entries in
    //   the central directory           SHORT
    //   size of the central directory   WORD
    //   offset of start of central
    //   directory with respect to
    //   the starting disk number        WORD
    //   .ZIP file comment length        SHORT
    //   .ZIP file comment               up to 64KB
    //

    /**
     * Reads the stream until it find the "End of central directory
     * record" and consumes it as well.
     */
    private void skipRemainderOfArchive() throws IOException{
        // skip over central directory. One LFH has been read too much
        // already.  The calculation discounts file names and extra
        // data so it will be too short.
        realSkip((long) entriesRead * CFH_LEN - LFH_LEN);
        findEocdRecord();
        realSkip((long) ZipFile.MIN_EOCD_SIZE - WORD /* signature */ - SHORT /* comment len */);
        readFully(shortBuf);
        // file comment
        realSkip(ZipShort.getValue(shortBuf));
    }

    /**
     * Reads forward until the signature of the "End of central
     * directory" record is found.
     */
    private void findEocdRecord() throws IOException{
        int currentByte = -1;
        boolean skipReadCall = false;
        while (skipReadCall || (currentByte = readOneByte()) > -1){
            skipReadCall = false;
            if (!isFirstByteOfEocdSig(currentByte)){
                continue;
            }
            currentByte = readOneByte();
            if (currentByte != ZipArchiveOutputStream.EOCD_SIG[1]){
                if (currentByte == -1){
                    break;
                }
                skipReadCall = isFirstByteOfEocdSig(currentByte);
                continue;
            }
            currentByte = readOneByte();
            if (currentByte != ZipArchiveOutputStream.EOCD_SIG[2]){
                if (currentByte == -1){
                    break;
                }
                skipReadCall = isFirstByteOfEocdSig(currentByte);
                continue;
            }
            currentByte = readOneByte();
            if (currentByte == -1 || currentByte == ZipArchiveOutputStream.EOCD_SIG[3]){
                break;
            }
            skipReadCall = isFirstByteOfEocdSig(currentByte);
        }
    }

    /**
     * Skips bytes by reading from the underlying stream rather than
     * the (potentially inflating) archive stream - which {@link
     * #skip} would do.
     *
     * Also updates bytes-read counter.
     */
    private void realSkip(final long value) throws IOException{
        if (value >= 0){
            long skipped = 0;
            while (skipped < value){
                final long rem = value - skipped;
                final int x = in.read(skipBuf, 0, (int) (skipBuf.length > rem ? rem : skipBuf.length));
                if (x == -1){
                    return;
                }
                count(x);
                skipped += x;
            }
            return;
        }
        throw new IllegalArgumentException();
    }

    /**
     * Reads bytes by reading from the underlying stream rather than
     * the (potentially inflating) archive stream - which {@link #read} would do.
     *
     * Also updates bytes-read counter.
     */
    private int readOneByte() throws IOException{
        final int b = in.read();
        if (b != -1){
            count(1);
        }
        return b;
    }

    private boolean isFirstByteOfEocdSig(final int b){
        return b == ZipArchiveOutputStream.EOCD_SIG[0];
    }

    private static final byte[]     APK_SIGNING_BLOCK_MAGIC = new byte[] {
                                                                           'A',
                                                                           'P',
                                                                           'K',
                                                                           ' ',
                                                                           'S',
                                                                           'i',
                                                                           'g',
                                                                           ' ',
                                                                           'B',
                                                                           'l',
                                                                           'o',
                                                                           'c',
                                                                           'k',
                                                                           ' ',
                                                                           '4',
                                                                           '2', };

    private static final BigInteger LONG_MAX                = BigInteger.valueOf(Long.MAX_VALUE);

    /**
     * Checks whether this might be an APK Signing Block.
     *
     * 
     * Unfortunately the APK signing block does not start with some kind of signature, it rather ends with one. It
     * starts with a length, so what we do is parse the suspect length, skip ahead far enough, look for the signature
     * and if we've found it, return true.
     * 
     *
     * @param suspectLocalFileHeader
     *            the bytes read from the underlying stream in the expectation that they would hold
     *            the local file header of the next entry.
     *
     * @return true if this looks like a APK signing block
     *
     * @see https://source.android.com/security/apksigning/v2
     */
    private boolean isApkSigningBlock(byte[] suspectLocalFileHeader) throws IOException{
        // length of block excluding the size field itself
        BigInteger len = ZipEightByteInteger.getValue(suspectLocalFileHeader);
        // LFH has already been read and all but the first eight bytes contain (part of) the APK signing block,
        // also subtract 16 bytes in order to position us at the magic string
        BigInteger toSkip = len.add(BigInteger.valueOf(DWORD - suspectLocalFileHeader.length - (long) APK_SIGNING_BLOCK_MAGIC.length));
        byte[] magic = new byte[APK_SIGNING_BLOCK_MAGIC.length];

        try{
            if (toSkip.signum() < 0){
                // suspectLocalFileHeader contains the start of suspect magic string
                int off = suspectLocalFileHeader.length + toSkip.intValue();
                // length was shorter than magic length
                if (off < DWORD){
                    return false;
                }
                int bytesInBuffer = Math.abs(toSkip.intValue());
                System.arraycopy(suspectLocalFileHeader, off, magic, 0, Math.min(bytesInBuffer, magic.length));
                if (bytesInBuffer < magic.length){
                    readFully(magic, bytesInBuffer);
                }
            }else{
                while (toSkip.compareTo(LONG_MAX) > 0){
                    realSkip(Long.MAX_VALUE);
                    toSkip = toSkip.add(LONG_MAX.negate());
                }
                realSkip(toSkip.longValue());
                readFully(magic);
            }
        }catch (EOFException ex){ //NOSONAR
            // length was invalid
            return false;
        }
        return Arrays.equals(magic, APK_SIGNING_BLOCK_MAGIC);
    }

    /**
     * Structure collecting information for the entry that is
     * currently being read.
     */
    private static final class CurrentEntry{

        /**
         * Current ZIP entry.
         */
        private final ZipArchiveEntry entry = new ZipArchiveEntry();

        /**
         * Does the entry use a data descriptor?
         */
        private boolean               hasDataDescriptor;

        /**
         * Does the entry have a ZIP64 extended information extra field.
         */
        private boolean               usesZip64;

        /**
         * Number of bytes of entry content read by the client if the
         * entry is STORED.
         */
        private long                  bytesRead;

        /**
         * Number of bytes of entry content read from the stream.
         *
         * 
         * This may be more than the actual entry's length as some
         * stuff gets buffered up and needs to be pushed back when the
         * end of the entry has been reached.
         * 
         */
        private long                  bytesReadFromStream;

        /**
         * The checksum calculated as the current entry is read.
         */
        private final CRC32           crc   = new CRC32();

        /**
         * The input stream decompressing the data for shrunk and imploded entries.
         */
        private InputStream           in;
    }

    /**
     * Bounded input stream adapted from commons-io
     */
    private class BoundedInputStream extends InputStream{

        /** the wrapped input stream */
        private final InputStream in;

        /** the max length to provide */
        private final long        max;

        /** the number of bytes already returned */
        private long              pos = 0;

        /**
         * Creates a new BoundedInputStream that wraps the given input
         * stream and limits it to a certain size.
         *
         * @param in
         *            The wrapped input stream
         * @param size
         *            The maximum number of bytes to return
         */
        public BoundedInputStream(final InputStream in, final long size){
            this.max = size;
            this.in = in;
        }

        @Override
        public int read() throws IOException{
            if (max >= 0 && pos >= max){
                return -1;
            }
            final int result = in.read();
            pos++;
            count(1);
            current.bytesReadFromStream++;
            return result;
        }

        @Override
        public int read(final byte[] b) throws IOException{
            return this.read(b, 0, b.length);
        }

        @Override
        public int read(final byte[] b,final int off,final int len) throws IOException{
            if (len == 0){
                return 0;
            }
            if (max >= 0 && pos >= max){
                return -1;
            }
            final long maxRead = max >= 0 ? Math.min(len, max - pos) : len;
            final int bytesRead = in.read(b, off, (int) maxRead);

            if (bytesRead == -1){
                return -1;
            }

            pos += bytesRead;
            count(bytesRead);
            current.bytesReadFromStream += bytesRead;
            return bytesRead;
        }

        @Override
        public long skip(final long n) throws IOException{
            final long toSkip = max >= 0 ? Math.min(n, max - pos) : n;
            final long skippedBytes = IOUtils.skip(in, toSkip);
            pos += skippedBytes;
            return skippedBytes;
        }

        @Override
        public int available() throws IOException{
            if (max >= 0 && pos >= max){
                return 0;
            }
            return in.available();
        }
    }
}