All downloads are free. The search and download functionality uses the official Maven repository.

io.permazen.util.UnsignedIntEncoder Maven / Gradle / Ivy


/*
 * Copyright (C) 2015 Archie L. Cobbs. All rights reserved.
 */

package io.permazen.util;

import com.google.common.base.Preconditions;

import java.io.EOFException;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.nio.ByteBuffer;

/**
 * Encodes unsigned (i.e., non-negative) {@code int} values to/from self-delimited binary, preserving sort order, and such
 * that the length of the encoding is optimized for values near zero and encoded values never begin with {@code 0xff}.
 *
 * 

* The encoding uses a simple prefixing format: * *

* * * * * * * * * * * * * * * * * * * * * * * * * * * * * *
Encoded BytesValue
{@code 0x00 ... 0xfa}Same
{@code 0xfb 0xWW}{@code 0xWW + 0xfb}
{@code 0xfc 0xWW 0xXX}{@code 0xWWXX + 0xfb}
{@code 0xfd 0xWW 0xXX 0xYY}{@code 0xWWXXYY + 0xfb}
{@code 0xfe 0xWW 0xXX 0xYY 0xZZ}{@code 0xWWXXYYZZ + 0xfb}
{@code 0xff}Illegal
*
*/ public final class UnsignedIntEncoder { /** * Maximum possible length of an encoded value. */ public static final int MAX_ENCODED_LENGTH = 5; /** * Minimum value that triggers a multi-byte encoding. */ public static final int MIN_MULTI_BYTE_VALUE = 0xfb; // values 0xfb ... 0xfe prefix multi-byte values private UnsignedIntEncoder() { } /** * Encode the given value. * * @param value value to encode * @return encoded value * @throws IllegalArgumentException if {@code value} is negative */ public static byte[] encode(int value) { final ByteWriter writer = new ByteWriter(UnsignedIntEncoder.encodeLength(value)); UnsignedIntEncoder.write(writer, value); return writer.getBytes(); } /** * Decode the given value. * * @param data encoded value * @return decoded value * @throws IllegalArgumentException if {@code bytes} contains an invalid encoding, or extra trailing garbage */ public static int decode(byte[] data) { final ByteReader reader = new ByteReader(data); final int value = UnsignedIntEncoder.read(reader); if (reader.remain() > 0) throw new IllegalArgumentException("encoded value contains extra trailing garbage"); return value; } /** * Encode the given value to the output. * * @param writer destination for the encoded value * @param value value to encode * @throws IllegalArgumentException if {@code value} is negative */ public static void write(ByteWriter writer, int value) { writer.makeRoom(MAX_ENCODED_LENGTH); writer.len += UnsignedIntEncoder.encode(value, writer.buf, writer.len); } /** * Encode the given value and write it to the given {@link OutputStream}. 
* * @param out destination for the encoded value * @param value value to encode * @throws IOException if an I/O error occurs * @throws NullPointerException if {@code out} is null */ public static void write(OutputStream out, int value) throws IOException { final byte[] array = new byte[UnsignedIntEncoder.MAX_ENCODED_LENGTH]; final int nbytes = UnsignedIntEncoder.encode(value, array, 0); out.write(array, 0, nbytes); } /** * Encode the given value and write it to the given {@link ByteBuffer}. * * @param buf destination for the encoded value * @param value value to encode * @throws java.nio.BufferOverflowException if {@code buf} overflows * @throws java.nio.ReadOnlyBufferException if {@code buf} is read-only * @throws NullPointerException if {@code buf} is null */ public static void write(ByteBuffer buf, int value) { final byte[] array = new byte[UnsignedIntEncoder.MAX_ENCODED_LENGTH]; final int nbytes = UnsignedIntEncoder.encode(value, array, 0); buf.put(array, 0, nbytes); } /** * Read and decode a value from the input. 
* * @param reader input holding an encoded value * @return the decoded value, always non-negative * @throws IllegalArgumentException if the encoded value is truncated * @throws IllegalArgumentException if an invalid encoding is encountered */ public static int read(ByteReader reader) { try { final int first = reader.readByte(); int value; switch (first) { case 0xfb: value = reader.readByte(); break; case 0xfc: value = (reader.readByte() << 8) | reader.readByte(); break; case 0xfd: value = (reader.readByte() << 16) | (reader.readByte() << 8) | reader.readByte(); break; case 0xfe: value = (reader.readByte() << 24) | (reader.readByte() << 16) | (reader.readByte() << 8) | reader.readByte(); if (value + MIN_MULTI_BYTE_VALUE < 0) throw new IllegalArgumentException("invalid unsigned int encoding with high bit set"); break; case 0xff: throw new IllegalArgumentException("invalid unsigned int encoding starting with 0xff"); default: return first; } return value + MIN_MULTI_BYTE_VALUE; } catch (IndexOutOfBoundsException e) { throw new IllegalArgumentException("encoded value is truncated", e); } } /** * Read and decode a value from the given {@link InputStream}. * * @param input input source for the encoded value * @return the decoded value * @throws IOException if an I/O error occurs * @throws EOFException if an unexpected EOF is encountered * @throws IllegalArgumentException if an invalid encoding is encountered * @throws NullPointerException if {@code input} is null */ public static int read(InputStream input) throws IOException { final int first = input.read(); if (first == -1) throw new EOFException(); final byte[] array = new byte[UnsignedIntEncoder.decodeLength(first)]; array[0] = (byte)first; for (int i = 1; i < array.length; i++) { final int next = input.read(); if (next == -1) throw new EOFException(); array[i] = (byte)next; } return UnsignedIntEncoder.read(new ByteReader(array)); } /** * Read and decode a value from the given {@link ByteBuffer}. 
* * @param buf input source for the encoded value * @return the decoded value * @throws java.nio.BufferUnderflowException if {@code buf} underflows * @throws IllegalArgumentException if an invalid encoding is encountered * @throws NullPointerException if {@code buf} is null */ public static int read(ByteBuffer buf) { final byte first = buf.get(); final byte[] array = new byte[UnsignedIntEncoder.decodeLength(first)]; array[0] = first; if (array.length > 1) buf.get(array, 1, array.length - 1); return UnsignedIntEncoder.read(new ByteReader(array)); } /** * Skip a value from the input. * * @param reader input holding an encoded value */ public static void skip(ByteReader reader) { final int first = reader.readByte(); if (first >= MIN_MULTI_BYTE_VALUE) reader.skip(first - MIN_MULTI_BYTE_VALUE + 1); } /** * Determine the length (in bytes) of an encoded value based on the first byte. * * @param first first byte of encoded value (in lower eight bits; other bits are ignored) * @return the length of the encoded value (including {@code first}) * @throws IllegalArgumentException if the lower eight bits of {@code first} equal {@code 0xff} */ public static int decodeLength(int first) { first &= 0xff; Preconditions.checkArgument(first != 0xff, "invalid unsigned int encoding starting with 0xff"); return first < MIN_MULTI_BYTE_VALUE ? 1 : first - MIN_MULTI_BYTE_VALUE + 2; } /** * Determine the length (in bytes) of the encoded value. * * @param value value to encode * @return the length of the encoded value, a value between one and {@link #MAX_ENCODED_LENGTH} * @throws IllegalArgumentException if {@code value} is negative */ public static int encodeLength(int value) { Preconditions.checkArgument(value >= 0, "value < 0"); value -= MIN_MULTI_BYTE_VALUE; if (value < 0) return 1; int length = 2; while ((value >>= 8) != 0) length++; return length; } /** * Encode the given value and write the encoded bytes into the given buffer. 
* * @param value value to encode * @param buf output buffer * @param off starting offset into output buffer * @return the number of encoded bytes written * @throws IllegalArgumentException if {@code value} is negative * @throws NullPointerException if {@code buf} is null * @throws ArrayIndexOutOfBoundsException if {@code off} is negative or the encoded value exceeds the given buffer */ public static int encode(int value, byte[] buf, int off) { Preconditions.checkArgument(value >= 0, "value < 0"); if (value < MIN_MULTI_BYTE_VALUE) { buf[off] = (byte)value; return 1; } value -= MIN_MULTI_BYTE_VALUE; int len = 1; int mask = 0xff000000; boolean encoding = false; for (int shift = 24; shift != 0; shift -= 8, mask >>= 8) { if (encoding || (value & mask) != 0L) { buf[off + len++] = (byte)(value >> shift); encoding = true; } } buf[off + len++] = (byte)value; buf[off] = (byte)(MIN_MULTI_BYTE_VALUE + len - 2); return len; } /** * Test routine. * * @param args command line arguments */ public static void main(String[] args) { for (String arg : args) { byte[] bytes = null; try { bytes = ByteUtil.parse(arg); } catch (IllegalArgumentException e) { if (arg.startsWith("0x")) bytes = ByteUtil.parse(arg.substring(2)); } if (bytes != null) { System.out.println("Decoding bytes: " + ByteUtil.toString(bytes)); try { final long value = UnsignedIntEncoder.decode(bytes); System.out.println("0x" + ByteUtil.toString(bytes) + " decodes to " + value + " (" + String.format("0x%016x", value) + ")"); } catch (IndexOutOfBoundsException | IllegalArgumentException e) { System.out.println("Error decoding " + ByteUtil.toString(bytes) + ": " + e); } } Integer value = null; try { value = Integer.parseInt(arg); } catch (IllegalArgumentException e) { // ignore } if (value != null && value >= 0) { System.out.println("Encoding value " + value); final ByteWriter writer = new ByteWriter(); UnsignedIntEncoder.write(writer, value); System.out.println(value + " (" + String.format("0x%016x", value) + ") encodes to 
" + ByteUtil.toString(writer.getBytes())); } } } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy