All Downloads are FREE. Search and download functionalities are using the official Maven repository.

uk.ac.starlink.util.Compression Maven / Gradle / Ivy

There is a newer version: 4.3
Show newest version
package uk.ac.starlink.util;

import java.io.BufferedInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.zip.GZIPInputStream;
import uk.ac.starlink.util.bzip2.CBZip2InputStream;

/**
 * Characterises the compression status of a stream, and provides methods
 * for decompressing it.
 *
 * @author   Mark Taylor (Starlink)
 */
public abstract class Compression {

    private String name;

    /** Number of bytes needed to determine compression type (magic number). */
    public static final int MAGIC_SIZE = 3;

    /**
     * Private sole constructor.
     *
     * @param   name  the name of this compression method
     */
    private Compression( String name ) {
        this.name = name;
    }

    /**
     * Returns a stream which is a decompressed version of the input stream,
     * according to this objects compression type.
     *
     * @param  raw  the raw input stream
     * @return  a stream giving the decompressed version of raw
     */
    public abstract InputStream decompress( InputStream raw ) 
            throws IOException;

    /**
     * Returns a Compression object characterising the compression (if any)
     * represented by a given magic number.
     *
     * @param  magic  a buffer containing the first {@link #MAGIC_SIZE}
     *         bytes of input of the stream to be characterised
     * @return  a Compression object of the type represented by
     *          magic
     * @throws IllegalArgumentException  if magic.length<MAGIC_SIZE
     */
    public static Compression getCompression( byte[] magic ) {
        if ( magic.length < MAGIC_SIZE ) {
            throw new IllegalArgumentException( 
                "Magic buffer must be at least MAGIC_SIZE=" + MAGIC_SIZE + 
                " bytes" );
        }
        else if ( magic[ 0 ] == (byte) 0x1f && 
                  magic[ 1 ] == (byte) 0x8b ) {
            return GZIP;
        }
        else if ( magic[ 0 ] == (byte) 'B' &&
                  magic[ 1 ] == (byte) 'Z' &&
                  magic[ 2 ] == (byte) 'h' ) {
            return BZIP2;
        }
        else if ( magic[ 0 ] == (byte) 0x1f &&
                  magic[ 1 ] == (byte) 0x9d ) {
            return COMPRESS;
        }
        else {
            return NONE;
        }
    }

    /**
     * Returns a decompressed version of the given input stream.
     *
     * @param  raw  the raw input stream
     * @return  the decompressed version of raw
     */
    public static InputStream decompressStatic( InputStream raw ) 
             throws IOException {
        if ( ! raw.markSupported() || DataSource.getMarkWorkaround() ) {
            raw = new BufferedInputStream( raw );
        }
        raw.mark( MAGIC_SIZE );
        byte[] buf = new byte[ MAGIC_SIZE ];
        raw.read( buf );
        raw.reset();
        Compression compress = getCompression( buf );
        return compress.decompress( raw );
    }

    /**
     * Returns the name of this compression type.
     *
     * @return  string representation
     */
    public String toString() {
        return name;
    }

    /**
     * A Compression object representing no compression (or perhaps an
     * unknown one).  The decompress method will return the
     * raw input stream unchanged.
     */
    public static final Compression NONE = new Compression( "none" ) {
        public InputStream decompress( InputStream raw ) throws IOException {
            return raw;
        }
    };

    /**
     * A Compression object representing GZip compression.
     */
    public static final Compression GZIP = new Compression( "gzip" ) {
        public InputStream decompress( InputStream raw ) throws IOException {
            return new GZIPInputStream( raw ) {

                /* This is a workaround for a bug in GZIPInputStream in
                 * J2SE1.4.0.
                 * GZIPInputStream.markSupported() returns true; however
                 * instances of this class do not support marking, which
                 * screws up some things that the DataSource class tries to do.
                 * So we fiddle the inflating stream to tell the truth. */
                /* Note this seems to be not uncommon in decompression streams
                 * (had to fix the same bug in the UncompressInputStream 
                 * implementation used here too). */
                /* (bug ID 4812237 submitted to 
                 * developer.java.sun.com by mbt) */
                public boolean markSupported() {
                    return false;
                }

                /* This is a workaround for a different bug, ID 4795134
                 * at bugs.sun.com.  Though that bug report claims it's not
                 * a defect, I disagree.
                 * InflaterInputStream (hence GZIPInputStream) can return 1
                 * even when the end of stream has been reached.  It is less
                 * damaging to report available as 0 when the real answer
                 * is non-zero than the other way around.  But it's probably
                 * a good idea to avoid relying on available() in any case. */
                public int available() throws IOException {
                    int avail = super.available();
                    return avail > 1 ? avail : 0;
                }
            };
        }
    };

    /**
     * A Compression object representing BZip2 compression.
     */
    public static final Compression BZIP2 = new Compression( "bzip2" ) {
        public InputStream decompress( InputStream raw ) throws IOException {

            /* Eat the first two bytes. */
            if ( raw.read() != 'B' || raw.read() != 'Z' ) {
                throw new IllegalArgumentException( 
                    "Wrong magic number for bzip2 encoding" );
            }
            return new CBZip2InputStream( raw, true );
        }
    };

    /**
     * A Compression object representing Unix compress-type compression.
     */
    public static final Compression COMPRESS = new Compression( "compress" ) {
        public InputStream decompress( InputStream raw ) throws IOException {
            return new UncompressInputStream( raw );
        }
    };
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy