// io.protostuff.ByteString Maven / Gradle / Ivy
//
// Go to download
// Show more of this group Show more artifacts with this name
// Show all versions of protostuff-api Show documentation
// serialization api for messages
// The newest version!
//========================================================================
//Copyright 2007-2009 David Yu [email protected]
//------------------------------------------------------------------------
//Licensed under the Apache License, Version 2.0 (the "License");
//you may not use this file except in compliance with the License.
//You may obtain a copy of the License at 
//http://www.apache.org/licenses/LICENSE-2.0
//Unless required by applicable law or agreed to in writing, software
//distributed under the License is distributed on an "AS IS" BASIS,
//WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
//See the License for the specific language governing permissions and
//limitations under the License.
//========================================================================

// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// http://code.google.com/p/protobuf/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

package io.protostuff;

import static io.protostuff.StringSerializer.STRING;

import java.io.DataOutput;
import java.io.IOException;
import java.io.OutputStream;
import java.io.UnsupportedEncodingException;
import java.nio.ByteBuffer;

/**
 * Immutable array of bytes.
 * 
 * @author [email protected] Bob Lee
 * @author [email protected] Kenton Varda
 * @author David Yu
 */
public final class ByteString
{
    // START EXTRA

    /**
     * Wraps the given array in a {@code ByteString} without copying it.
     * <p>
     * Package-private to avoid double memory allocation: the returned instance shares {@code bytes} with the caller,
     * so the caller must not modify the array afterwards.
     * 
     * @param bytes
     *            the array to wrap (not copied)
     * @return a {@code ByteString} backed directly by {@code bytes}
     */
    static ByteString wrap(byte[] bytes)
    {
        return new ByteString(bytes);
    }

    /**
     * Returns the internal backing array without copying it.
     * <p>
     * Package-private to avoid double memory allocation: callers must not modify the returned array.
     */
    byte[] getBytes()
    {
        return bytes;
    }

    /**
     * Writes the bytes to the {@link OutputStream}.
     * 
     * @param out
     *            the stream to write to
     * @param bs
     *            the bytes to write
     * @throws IOException
     *             if the underlying write fails
     */
    public static void writeTo(OutputStream out, ByteString bs) throws IOException
    {
        out.write(bs.bytes);
    }

    /**
     * Writes the bytes to the {@link DataOutput}.
     * 
     * @param out
     *            the data output to write to
     * @param bs
     *            the bytes to write
     * @throws IOException
     *             if the underlying write fails
     */
    public static void writeTo(DataOutput out, ByteString bs) throws IOException
    {
        out.write(bs.bytes);
    }

    /**
     * Writes the bytes to the {@link Output}.
     * 
     * @param output
     *            the output to write to
     * @param bs
     *            the bytes to write
     * @param fieldNumber
     *            the field number passed through to {@code Output.writeByteArray}
     * @param repeated
     *            the repeated flag passed through to {@code Output.writeByteArray}
     * @throws IOException
     *             if the underlying write fails
     */
    public static void writeTo(Output output, ByteString bs, int fieldNumber,
            boolean repeated) throws IOException
    {
        output.writeByteArray(fieldNumber, bs.bytes, repeated);
    }

    /**
     * Returns a short diagnostic description of the form {@code <ByteString@HEX size=N>}, where {@code HEX} is the
     * identity hash code of this instance in hexadecimal and {@code N} is {@link #size()}. The contents are not
     * included.
     */
    @Override
    public String toString()
    {
        // The format string must carry both placeholders; an empty template would
        // silently discard the arguments and always yield "".
        return String.format("<ByteString@%s size=%d>",
                Integer.toHexString(System.identityHashCode(this)), size());
    }

    // END EXTRA

    /** The backing array; never exposed publicly without a copy or a read-only wrapper. */
    private final byte[] bytes;

    /**
     * Creates an instance backed directly by {@code bytes} (no copy is made).
     */
    private ByteString(final byte[] bytes)
    {
        this.bytes = bytes;
    }

    /**
     * Gets the byte at the given index.
     * 
     * @param index
     *            zero-based position of the byte
     * @return the byte at {@code index}
     * @throws ArrayIndexOutOfBoundsException
     *             {@code index} is < 0 or >= size
     */
    public byte byteAt(final int index)
    {
        return bytes[index];
    }

    /**
     * Gets the number of bytes.
     */
    public int size()
    {
        return bytes.length;
    }

    /**
     * Returns {@code true} if the size is {@code 0}, {@code false} otherwise.
     */
    public boolean isEmpty()
    {
        return bytes.length == 0;
    }

    // =================================================================
    // byte[] -> ByteString

    /**
     * Empty String.
     */
    public static final String EMPTY_STRING = "";

    /**
     * Empty byte array.
     */
    public static final byte[] EMPTY_BYTE_ARRAY = new byte[0];

    /**
     * Empty ByteString.
     */
    // Must be declared after EMPTY_BYTE_ARRAY: static initializers run in textual order.
    public static final ByteString EMPTY = new ByteString(EMPTY_BYTE_ARRAY);

    /**
     * Copies the given bytes into a {@code ByteString}.
     * 
     * @param bytes
     *            source array
     * @param offset
     *            index of the first byte to copy
     * @param size
     *            number of bytes to copy
     * @return a {@code ByteString} holding a private copy of the requested range
     */
    public static ByteString copyFrom(final byte[] bytes, final int offset,
            final int size)
    {
        final byte[] copy = new byte[size];
        System.arraycopy(bytes, offset, copy, 0, size);
        return new ByteString(copy);
    }

    /**
     * Copies the given bytes into a {@code ByteString}.
     * 
     * @param bytes
     *            source array, copied in full
     * @return a {@code ByteString} holding a private copy of {@code bytes}
     */
    public static ByteString copyFrom(final byte[] bytes)
    {
        return copyFrom(bytes, 0, bytes.length);
    }

    /**
     * Encodes {@code text} into a sequence of bytes using the named charset and returns the result as a
     * {@code ByteString}.
     * 
     * @param text
     *            the text to encode
     * @param charsetName
     *            the name of the charset to encode with
     * @throws RuntimeException
     *             wrapping the {@link UnsupportedEncodingException} if the named charset is not supported
     */
    public static ByteString copyFrom(final String text, final String charsetName)
    {
        try
        {
            return new ByteString(text.getBytes(charsetName));
        }
        catch (UnsupportedEncodingException e)
        {
            throw new RuntimeException(charsetName + " not supported?", e);
        }
    }

    /**
     * Encodes {@code text} into a sequence of UTF-8 bytes and returns the result as a {@code ByteString}.
     * <p>
     * The encoding is delegated to {@code StringSerializer.STRING}.
     */
    public static ByteString copyFromUtf8(final String text)
    {
        return new ByteString(STRING.ser(text));
        /*
         * @try { return new ByteString(text.getBytes("UTF-8")); } catch (UnsupportedEncodingException e) { throw new
         * RuntimeException("UTF-8 not supported?", e); }
         */
    }

    // =================================================================
    // ByteString -> byte[]

    /**
     * Copies all bytes into a buffer at the given offset.
     * 
     * @param target
     *            buffer to copy into
     * @param offset
     *            in the target buffer
     */
    public void copyTo(final byte[] target, final int offset)
    {
        System.arraycopy(bytes, 0, target, offset, bytes.length);
    }

    /**
     * Copies bytes into a buffer.
     * 
     * @param target
     *            buffer to copy into
     * @param sourceOffset
     *            offset within these bytes
     * @param targetOffset
     *            offset within the target buffer
     * @param size
     *            number of bytes to copy
     */
    public void copyTo(final byte[] target, final int sourceOffset,
            final int targetOffset,
            final int size)
    {
        System.arraycopy(bytes, sourceOffset, target, targetOffset, size);
    }

    /**
     * Copies bytes to a {@code byte[]}.
     * 
     * @return a new array with the same contents; modifying it does not affect this instance
     */
    public byte[] toByteArray()
    {
        final int size = bytes.length;
        final byte[] copy = new byte[size];
        System.arraycopy(bytes, 0, copy, 0, size);
        return copy;
    }

    /**
     * Constructs a new read-only {@code java.nio.ByteBuffer} with the same backing byte array.
     */
    public ByteBuffer asReadOnlyByteBuffer()
    {
        final ByteBuffer byteBuffer = ByteBuffer.wrap(bytes);
        return byteBuffer.asReadOnlyBuffer();
    }

    /*
     * @ Constructs a new {@code String} by decoding the bytes using the specified charset.
     */
    /*
     * @public String unsignedIntToString(final String charsetName) throws UnsupportedEncodingException { return new String(bytes,
     * charsetName); }
     */

    /**
     * Constructs a new {@code String} by decoding the bytes as UTF-8.
     * <p>
     * The decoding is delegated to {@code StringSerializer.STRING}.
     */
    public String toStringUtf8()
    {
        return STRING.deser(bytes);
        /*
         * @try { return new String(bytes, "UTF-8"); } catch (UnsupportedEncodingException e) { throw new
         * RuntimeException("UTF-8 not supported?", e); }
         */
    }

    // =================================================================
    // equals() and hashCode()

    /**
     * Returns {@code true} if {@code o} is this instance, or is a {@code ByteString} with the same contents. The
     * cached hash codes are not consulted.
     */
    @Override
    public boolean equals(final Object o)
    {
        return o == this || (o instanceof ByteString && equals(this, (ByteString) o, false));
    }

    /**
     * Returns true if the contents of both match.
     * 
     * @param bs
     *            first operand
     * @param other
     *            second operand
     * @param checkHash
     *            if {@code true}, and both instances already have a cached (non-zero) hash code, differing hashes
     *            short-circuit the comparison to {@code false}
     */
    public static boolean equals(ByteString bs, ByteString other, boolean checkHash)
    {
        final int size = bs.bytes.length;
        if (size != other.bytes.length)
        {
            return false;
        }

        if (checkHash)
        {
            // volatile reads
            // A value of 0 means "not computed yet", so only non-zero hashes are comparable.
            final int h1 = bs.hash, h2 = other.hash;
            if (h1 != 0 && h2 != 0 && h1 != h2)
            {
                return false;
            }
        }

        final byte[] thisBytes = bs.bytes;
        final byte[] otherBytes = other.bytes;
        for (int i = 0; i < size; i++)
        {
            if (thisBytes[i] != otherBytes[i])
            {
                return false;
            }
        }

        return true;
    }

    /**
     * Returns true if the contents of the internal array and the provided array match.
     * 
     * @param data
     *            the array to compare against, in full
     */
    public boolean equals(final byte[] data)
    {
        return equals(data, 0, data.length);
    }

    /**
     * Returns true if the contents of the internal array and the provided array match.
     * 
     * @param data
     *            the array to compare against
     * @param offset
     *            index in {@code data} of the first byte to compare
     * @param len
     *            number of bytes to compare; must equal {@link #size()} for a match
     */
    public boolean equals(final byte[] data, int offset, final int len)
    {
        final byte[] bytes = this.bytes;
        if (len != bytes.length)
            return false;

        for (int i = 0; i < len;)
        {
            if (bytes[i++] != data[offset++])
            {
                return false;
            }
        }

        return true;
    }

    /** Cached hash code; {@code 0} means it has not been computed yet. */
    private volatile int hash = 0;

    /**
     * Returns a hash code derived from the size and contents, computing it on first use and caching it afterwards.
     */
    @Override
    public int hashCode()
    {
        int h = hash;

        if (h == 0)
        {
            final byte[] thisBytes = bytes;
            final int size = bytes.length;

            h = size;
            for (int i = 0; i < size; i++)
            {
                h = h * 31 + thisBytes[i];
            }
            // 0 is reserved as the "not computed" marker, so remap a genuine 0 to 1.
            if (h == 0)
            {
                h = 1;
            }

            hash = h;
        }

        return h;
    }

    // =================================================================
    // Input stream

    /*
     * @ Creates an {@code InputStream} which can be used to read the bytes.
     */
    /*
     * @public InputStream newInput() { return new ByteArrayInputStream(bytes); }
     */

    /*
     * @ Creates a {@link CodedInputStream} which can be used to read the bytes. Using this is more efficient than
     * creating a {@link CodedInputStream} wrapping the result of {@link #newInput()}.
     */
    /*
     * @public CodedInputStream newCodedInput() { // We trust CodedInputStream not to modify the bytes, or to give
     * anyone // else access to them. return CodedInputStream.newInstance(bytes); }
     */

    // =================================================================
    // Output stream

    /*
     * @ Creates a new {@link Output} with the given initial capacity.
     */
    /*
     * @public static Output newOutput(final int initialCapacity) { return new Output(new
     * ByteArrayOutputStream(initialCapacity)); }
     */

    /*
     * @ Creates a new {@link Output}.
     */
    /*
     * @public static Output newOutput() { return newOutput(32); }
     */

    /*
     * @ Outputs to a {@code ByteString} instance. Call {@link #toByteString()} to create the {@code ByteString}
     * instance.
     */
    /*
     * @public static final class Output extends FilterOutputStream { private final ByteArrayOutputStream bout;
     * 
     * /** Constructs a new output with the given initial capacity.
     * 
     * @ private Output(final ByteArrayOutputStream bout) { super(bout); this.bout = bout; }
     * 
     * /** Creates a {@code ByteString} instance from this {@code Output}.
     * 
     * @ public ByteString toByteString() { final byte[] byteArray = bout.toByteArray(); return new
     * ByteString(byteArray); } }
     * 
     * /** Constructs a new ByteString builder, which allows you to efficiently construct a {@code ByteString} by
     * writing to a {@link CodedOutputStream}. Using this is much more efficient than calling {@code newOutput()} and
     * wrapping that in a {@code CodedOutputStream}.
     * 
     * This is package-private because it's a somewhat confusing interface. Users can call {@link
     * Message#toByteString()} instead of calling this directly.
     * 
     * @param size The target byte size of the {@code ByteString}. You must write exactly this many bytes before
     * building the result.
     * 
     * @ static CodedBuilder newCodedBuilder(final int size) { return new CodedBuilder(size); }
     * 
     * /** See {@link ByteString#newCodedBuilder(int)}. *@ static final class CodedBuilder { private final
     * CodedOutputStream output; private final byte[] buffer;
     * 
     * private CodedBuilder(final int size) { buffer = new byte[size]; output = CodedOutputStream.newInstance(buffer); }
     * 
     * public ByteString build() { output.checkNoSpaceLeft();
     * 
     * // We can be confident that the CodedOutputStream will not modify the // underlying bytes anymore because it
     * already wrote all of them. So, // no need to make a copy. return new ByteString(buffer); }
     * 
     * public CodedOutputStream getCodedOutput() { return output; } }
     */

    // moved from Internal.java

    /**
     * Helper called by generated code to construct default values for string fields.
     * <p>
     * The protocol compiler does not actually contain a UTF-8 decoder -- it just pushes UTF-8-encoded text around
     * without touching it. The one place where this presents a problem is when generating Java string literals. Unicode
     * characters in the string literal would normally need to be encoded using a Unicode escape sequence, which would
     * require decoding them. To get around this, protoc instead embeds the UTF-8 bytes into the generated code and
     * leaves it to the runtime library to decode them.
     * <p>
     * It gets worse, though. If protoc just generated a byte array, like: new byte[] {0x12, 0x34, 0x56, 0x78} Java
     * actually generates *code* which allocates an array and then fills in each value. This is much less efficient than
     * just embedding the bytes directly into the bytecode. To get around this, we need another work-around. String
     * literals are embedded directly, so protoc actually generates a string literal corresponding to the bytes. The
     * easiest way to do this is to use the ISO-8859-1 character set, which corresponds to the first 256 characters of
     * the Unicode range. Protoc can then use good old CEscape to generate the string.
     * <p>
     * So we have a string literal which represents a set of bytes which represents another string. This function --
     * stringDefaultValue -- converts from the generated string to the string we actually want. The generated code calls
     * this automatically.
     * 
     * @param bytes
     *            the generated literal, whose characters stand for raw bytes (ISO-8859-1)
     * @return the string obtained by decoding those bytes as UTF-8
     * @throws IllegalStateException
     *             if the JVM does not support ISO-8859-1 or UTF-8
     */
    public static String stringDefaultValue(String bytes)
    {
        try
        {
            return new String(bytes.getBytes("ISO-8859-1"), "UTF-8");
        }
        catch (UnsupportedEncodingException e)
        {
            // This should never happen since all JVMs are required to implement
            // both of the above character sets.
            throw new IllegalStateException(
                    "Java VM does not support a standard character set.", e);
        }
    }

    /**
     * Helper called by generated code to construct default values for bytes fields.
     * <p>
     * This is a lot like {@link #stringDefaultValue}, but for bytes fields. In this case we only need the second of the
     * two hacks -- allowing us to embed raw bytes as a string literal with ISO-8859-1 encoding.
     * 
     * @param bytes
     *            the generated literal, whose characters stand for raw bytes (ISO-8859-1)
     * @return a {@code ByteString} wrapping the ISO-8859-1 encoding of {@code bytes}
     */
    public static ByteString bytesDefaultValue(String bytes)
    {
        return new ByteString(byteArrayDefaultValue(bytes));
    }

    /**
     * Helper called by generated code to construct default values for byte array fields.
     * <p>
     * This is a lot like {@link #stringDefaultValue}, but for bytes fields. In this case we only need the second of the
     * two hacks -- allowing us to embed raw bytes as a string literal with ISO-8859-1 encoding.
     * 
     * @param bytes
     *            the generated literal, whose characters stand for raw bytes (ISO-8859-1)
     * @return the ISO-8859-1 encoding of {@code bytes}
     * @throws IllegalStateException
     *             if the JVM does not support ISO-8859-1
     */
    public static byte[] byteArrayDefaultValue(String bytes)
    {
        try
        {
            return bytes.getBytes("ISO-8859-1");
        }
        catch (UnsupportedEncodingException e)
        {
            // This should never happen since all JVMs are required to implement
            // ISO-8859-1.
            throw new IllegalStateException(
                    "Java VM does not support a standard character set.", e);
        }
    }
}