scodec.codecs.codecs.scala Maven / Gradle / Ivy
/*
* Copyright (c) 2013, Scodec
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without modification,
* are permitted provided that the following conditions are met:
*
* 1. Redistributions of source code must retain the above copyright notice, this
* list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright notice,
* this list of conditions and the following disclaimer in the documentation
* and/or other materials provided with the distribution.
*
* 3. Neither the name of the copyright holder nor the names of its contributors
* may be used to endorse or promote products derived from this software without
* specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
* DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
* ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
* ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
package scodec
package codecs
import scala.math.{floor, log10}
import java.nio.charset.Charset
import java.security.cert.{Certificate, X509Certificate}
import java.util.UUID
import scodec.bits.*
// TODO - Move this old package level ScalaDoc to the right place when scala 3 supports package documentation
/**
* Provides codecs for common types and combinators for building larger codecs.
*
* === Bits and Bytes Codecs ===
*
* The simplest of the provided codecs are those that encode/decode `BitVector`s and `ByteVectors` directly.
* These are provided by `bits` and `bytes` methods. These codecs encode all of the bits/bytes directly
* in to the result and decode *all* of the remaining bits/bytes in to the result value. That is, the result
* of `decode` always returns a empty bit vector for the remaining bits.
*
* Similarly, fixed size alternatives are provided by the `bits(size)` and `bytes(size)` methods, which
* encode a fixed number of bits/bytes (or error if not provided the correct size) and decoded a fixed number
* of bits/bytes (or error if that many bits/bytes are not available).
*
* There are more specialized codecs for working with bits, including `ignore` and `constant`.
*
*
* === Numeric Codecs ===
*
* There are built-in codecs for `Int`, `Long`, `Float`, and `Double`.
*
* There are a number of predefined integral codecs named using the form: {{{
[u]int$${size}[L]
}}}
* where `u` stands for unsigned, `size` is replaced by one of `8, 16, 24, 32, 64`, and `L` stands for little-endian.
* For each codec of that form, the type is `Codec[Int]` or `Codec[Long]` depending on the specified size.
* For example, `int32` supports 32-bit big-endian 2s complement signed integers, and uint16L supports 16-bit little-endian
* unsigned integers.
* Note: `uint64[L]` are not provided because a 64-bit unsigned integer does not fit in to a `Long`.
*
* Additionally, methods of the form `[u]int[L](size: Int)` and `[u]long[L](size: Int)` exist to build arbitrarily
* sized codecs, within the limitations of `Int` and `Long`.
*
* IEEE 754 floating point values are supported by the [[float]], [[floatL]], [[double]], and [[doubleL]] codecs.
*
*
* === Miscellaneous Value Codecs ===
*
* In addition to the numeric codecs, there are built-in codecs for `Boolean`, `String`, and `UUID`.
*
* Boolean values are supported by the `bool` codecs.
*
*
* === Combinators ===
*
* There are a number of methods provided that create codecs out of other codecs. These include simple combinators
* such as [[fixedSizeBits]] and [[variableSizeBits]] and advanced combinators such as [[discriminated]], which
* provides its own DSL for building a large codec out of many small codecs. For a list of all combinators,
* see the Combinators section below.
*
* === Cryptography Codecs ===
*
* There are codecs that support working with encrypted data ([[encrypted]]), digital signatures and checksums
* ([[fixedSizeSignature]] and [[variableSizeSignature]]). Additionally, support for `java.security.cert.Certificate`s
* is provided by [[certificate]] and [[x509Certificate]].
*/
/**
* Encodes by returning supplied bit vector; decodes by taking all remaining bits in the supplied bit vector.
*/
val bits: Codec[BitVector] = new Codec[BitVector]:
def sizeBound = SizeBound.unknown
def encode(buffer: BitVector) = Attempt.successful(buffer)
def decode(buffer: BitVector) = Attempt.successful(DecodeResult(buffer, BitVector.empty))
override def toString = "bits"
/**
* Encodes by returning the supplied bit vector if its length is `size` bits, padding with zeroes if smaller than `size` bits, returning error if greater;
* decodes by taking `size` bits from the supplied bit vector.
*
* @param size number of bits to encode/decode
*/
def bits(size: Long): Codec[BitVector] =
fixedSizeBits(size, bits).withToString(s"bits($size)")
/**
* Encodes by returning the supplied bit vector if its length is `size` bits, otherwise returning error;
* decodes by taking `size` bits from the supplied bit vector.
*
* @param size number of bits to encode/decode
*/
def bitsStrict(size: Long): Codec[BitVector] =
new FixedSizeStrictCodec(size, bits).withToString(s"bitsStrict($size)")
/**
* Encodes by returning supplied byte vector as a bit vector; decodes by taking all remaining bits in supplied bit vector and converting to a byte vector.
*/
val bytes: Codec[ByteVector] =
bits.xmapc(_.bytes)(_.bits).withToString("bytes")
/**
* Encodes by returning the supplied byte vector if its length is `size` bytes, padding with zeroes if smaller than `size` bytes, returning error if greater;
* decodes by taking `size * 8` bits from the supplied bit vector and converting to a byte vector.
*
* @param size number of bytes to encode/decode
*/
def bytes(size: Int): Codec[ByteVector] =
fixedSizeBytes(size.toLong, bits).xmapc(_.bytes)(_.bits).withToString(s"bytes($size)")
/**
* Encodes by returning the supplied byte vector if its length is `size` bytes, otherwise returning error;
* decodes by taking `size * 8` bits from the supplied bit vector and converting to a byte vector.
*
* @param size number of bytes to encode/decode
*/
def bytesStrict(size: Int): Codec[ByteVector] =
new FixedSizeStrictCodec(size * 8L, bits).xmapc(_.bytes)(_.bits).withToString(s"bytesStrict($size)")
/**
* Codec for 8-bit 2s complement bytes.
*/
val byte: Codec[Byte] = new ByteCodec(8, true)
/**
* Codec for 8-bit unsigned bytes.
*/
val ushort8: Codec[Short] = new ShortCodec(8, false, ByteOrdering.BigEndian)
/**
* Codec for 16-bit 2s complement big-endian shorts.
*/
val short16: Codec[Short] = new ShortCodec(16, true, ByteOrdering.BigEndian)
/**
* Codec for 8-bit 2s complement big-endian integers.
*/
val int8: Codec[Int] = new IntCodec(8, true, ByteOrdering.BigEndian)
/**
* Codec for 16-bit 2s complement big-endian integers.
*/
val int16: Codec[Int] = new IntCodec(16, true, ByteOrdering.BigEndian)
/**
* Codec for 24-bit 2s complement big-endian integers.
*/
val int24: Codec[Int] = new IntCodec(24, true, ByteOrdering.BigEndian)
/**
* Codec for 32-bit 2s complement big-endian integers.
*/
val int32: Codec[Int] = new IntCodec(32, true, ByteOrdering.BigEndian)
/**
* Codec for 64-bit 2s complement big-endian integers.
*/
val int64: Codec[Long] = new LongCodec(64, true, ByteOrdering.BigEndian)
/**
* Codec for 2-bit unsigned big-endian integers.
*/
val uint2: Codec[Int] = new IntCodec(2, false, ByteOrdering.BigEndian)
/**
* Codec for 4-bit unsigned big-endian integers.
*/
val uint4: Codec[Int] = new IntCodec(4, false, ByteOrdering.BigEndian)
/**
* Codec for 8-bit unsigned big-endian integers.
*/
val uint8: Codec[Int] = new IntCodec(8, false, ByteOrdering.BigEndian)
/**
* Codec for 16-bit unsigned big-endian integers.
*/
val uint16: Codec[Int] = new IntCodec(16, false, ByteOrdering.BigEndian)
/**
* Codec for 24-bit unsigned big-endian integers.
*/
val uint24: Codec[Int] = new IntCodec(24, false, ByteOrdering.BigEndian)
/**
* Codec for 32-bit unsigned big-endian integers.
*/
val uint32: Codec[Long] = new LongCodec(32, false, ByteOrdering.BigEndian)
/**
* Codec for 16-bit 2s complement little-endian shorts.
*/
val short16L: Codec[Short] = new ShortCodec(16, true, ByteOrdering.LittleEndian)
/**
* Codec for 8-bit 2s complement little-endian integers.
*/
val int8L: Codec[Int] = new IntCodec(8, true, ByteOrdering.LittleEndian)
/**
* Codec for 16-bit 2s complement little-endian integers.
*/
val int16L: Codec[Int] = new IntCodec(16, true, ByteOrdering.LittleEndian)
/**
* Codec for 24-bit 2s complement little-endian integers.
*/
val int24L: Codec[Int] = new IntCodec(24, true, ByteOrdering.LittleEndian)
/**
* Codec for 32-bit 2s complement little-endian integers.
*/
val int32L: Codec[Int] = new IntCodec(32, true, ByteOrdering.LittleEndian)
/**
* Codec for 64-bit 2s complement little-endian integers.
*/
val int64L: Codec[Long] = new LongCodec(64, true, ByteOrdering.LittleEndian)
/**
* Codec for 2-bit unsigned little-endian integers.
*/
val uint2L: Codec[Int] = new IntCodec(2, false, ByteOrdering.LittleEndian)
/**
* Codec for 4-bit unsigned little-endian integers.
*/
val uint4L: Codec[Int] = new IntCodec(4, false, ByteOrdering.LittleEndian)
/**
* Codec for 8-bit unsigned little-endian integers.
*/
val uint8L: Codec[Int] = new IntCodec(8, false, ByteOrdering.LittleEndian)
/**
* Codec for 16-bit unsigned little-endian integers.
*/
val uint16L: Codec[Int] = new IntCodec(16, false, ByteOrdering.LittleEndian)
/**
* Codec for 24-bit unsigned little-endian integers.
*/
val uint24L: Codec[Int] = new IntCodec(24, false, ByteOrdering.LittleEndian)
/**
* Codec for 32-bit unsigned little-endian integers.
*/
val uint32L: Codec[Long] = new LongCodec(32, false, ByteOrdering.LittleEndian)
/**
* Codec for variable-length big-endian integers.
* Encoding requires between 1 and 5 bytes, depending on the value.
* Smaller ints require less bytes. Negative values are always encoded with 5 bytes.
*/
val vint: Codec[Int] = new VarIntCodec(ByteOrdering.BigEndian)
/**
* Codec for variable-length little-endian integers.
* Encoding requires between 1 and 5 bytes, depending on the value.
* Smaller ints require less bytes. Negative values are always encoded with 5 bytes.
*/
val vintL: Codec[Int] = new VarIntCodec(ByteOrdering.LittleEndian)
/**
* Codec for variable-length big-endian longs.
* Encoding requires between 1 and 9 bytes, depending on the value.
* Smaller longs require less bytes.
* Negative values are not supported.
*/
val vlong: Codec[Long] = new VarLongCodec(ByteOrdering.BigEndian)
/**
* Codec for variable-length packed decimal longs.
* Negative values are not supported.
*/
val vpbcd: Codec[Long] = VarPackedDecimalCodec
/**
* Codec for variable-length little-endian longs.
* Encoding requires between 1 and 9 bytes, depending on the value.
* Smaller longs require less bytes.
* Negative values are not supported.
*/
val vlongL: Codec[Long] = new VarLongCodec(ByteOrdering.LittleEndian)
/**
* Codec for n-bit 2s complement bytes.
* @param size number of bits (must be 0 < size <= 8)
*/
def byte(size: Int): Codec[Byte] = new ByteCodec(size, true)
/**
* Codec for n-bit unsigned bytes.
* @param size number of bits (must be 0 < size <= 7)
*/
def ubyte(size: Int): Codec[Byte] = new ByteCodec(size, false)
/**
* Codec for n-bit 2s complement big-endian shorts.
* @param size number of bits (must be 0 < size <= 16)
*/
def short(size: Int): Codec[Short] = new ShortCodec(size, true, ByteOrdering.BigEndian)
/**
* Codec for n-bit unsigned big-endian shorts.
* @param size number of bits (must be 0 < size <= 15)
*/
def ushort(size: Int): Codec[Short] = new ShortCodec(size, false, ByteOrdering.BigEndian)
/**
* Codec for n-bit 2s complement big-endian integers that are represented with `Int`.
* @param size number of bits (must be 0 < size <= 32)
*/
def int(size: Int): Codec[Int] = new IntCodec(size, true, ByteOrdering.BigEndian)
/**
* Codec for n-bit unsigned big-endian integers that are represented with `Int`.
* @param bits number of bits (must be 0 < size <= 31)
*/
def uint(bits: Int): Codec[Int] = new IntCodec(bits, false, ByteOrdering.BigEndian)
/**
* Codec for n-bit 2s complement big-endian integers that are represented with `Long`.
* @param bits number of bits (must be 0 < size <= 64)
*/
def long(bits: Int): Codec[Long] = new LongCodec(bits, true, ByteOrdering.BigEndian)
/**
* Codec for n-bit unsigned big-endian integers that are represented with `Long`.
* @param bits number of bits (must be 0 < size <= 63)
*/
def ulong(bits: Int): Codec[Long] = new LongCodec(bits, false, ByteOrdering.BigEndian)
/**
* Codec for n-bit 2s complement little-endian shorts.
* @param size number of bits (must be 0 < size <= 16)
*/
def shortL(size: Int): Codec[Short] = new ShortCodec(size, true, ByteOrdering.LittleEndian)
/**
* Codec for n-bit unsigned little-endian shorts.
* @param size number of bits (must be 0 < size <= 15)
*/
def ushortL(size: Int): Codec[Short] = new ShortCodec(size, false, ByteOrdering.LittleEndian)
/**
* Codec for n-bit 2s complement little-endian integers that are represented with `Int`.
* @param bits number of bits (must be 0 < size <= 32)
*/
def intL(bits: Int): Codec[Int] = new IntCodec(bits, true, ByteOrdering.LittleEndian)
/**
* Codec for n-bit unsigned little-endian integers that are represented with `Int`.
* @param bits number of bits (must be 0 < size <= 31)
*/
def uintL(bits: Int): Codec[Int] = new IntCodec(bits, false, ByteOrdering.LittleEndian)
/**
* Codec for n-bit 2s complement little-endian integers that are represented with `Long`.
* @param bits number of bits (must be 0 < size <= 64)
*/
def longL(bits: Int): Codec[Long] = new LongCodec(bits, true, ByteOrdering.LittleEndian)
/**
* Codec for n-bit unsigned little-endian integers that are represented with `Long`.
* @param bits number of bits (must be 0 < size <= 63)
*/
def ulongL(bits: Int): Codec[Long] = new LongCodec(bits, false, ByteOrdering.LittleEndian)
/**
* Codec for n-nibble packed decimal (BCD) integers that are represented with `Long`.
* @param nibbles number of nibbles (4-bit chunks)
*/
def pbcd(nibbles: Int): Codec[Long] = new Codec[Long] {
private def width: Long = nibbles.toLong * 4L
def decode(bits: BitVector): Attempt[DecodeResult[Long]] =
bits.consumeThen(width)(
e => Attempt.failure(Err(e)),
(bits, rem) => vpbcd.decodeValue(bits).map(a => DecodeResult(a, rem))
)
def encode(l: Long): Attempt[BitVector] = vpbcd.encode(l).map(_.padLeft(width))
def sizeBound = SizeBound.exact(width)
}
/**
* Codec for n-nibble packed decimal (BCD) integers that are represented with `Long`.
* This codec, despite requiring the size in nibbles, is byte-size oriented.
* This means it expects to parse complete bytes (even if nibble size is
* odd). For encoding, this codec will pad 0s on the left while, for
* decoding, it will fetch the size in bytes round up.
* @param nibbles number of nibbles (4-bit chunks)
*/
def lpbcd(nibbles: Int): Codec[Long] = new Codec[Long] {
val nsize = nibbles.toLong * 4
val bsize = nsize + nsize % 8
def sizeBound = SizeBound.exact(bsize)
def decode(b: BitVector) = fixedSizeBits(bsize, vpbcd).decode(b)
def encode(l: Long) = fixedSizeBits(nsize, vpbcd).encode(l).map { x =>
val size: Long = floor(log10(l.toDouble) + 1).toLong * 4
(BitVector.low(bsize) ++ x.take(size)).drop(size)
}
}
/**
* 32-bit big endian IEEE 754 floating point number.
*/
val float: Codec[Float] = new FloatCodec(ByteOrdering.BigEndian)
/**
* 32-bit little endian IEEE 754 floating point number.
*/
val floatL: Codec[Float] = new FloatCodec(ByteOrdering.LittleEndian)
/**
* 64-bit big endian IEEE 754 floating point number.
*/
val double: Codec[Double] = new DoubleCodec(ByteOrdering.BigEndian)
/**
* 64-bit little endian IEEE 754 floating point number.
*/
val doubleL: Codec[Double] = new DoubleCodec(ByteOrdering.LittleEndian)
/**
* 1-bit boolean codec, where false corresponds to bit value 0 and true corresponds to bit value 1.
*/
val bool: Codec[Boolean] = BooleanCodec
/**
* n-bit boolean codec, where false corresponds to bit vector of all 0s and true corresponds to all other vectors.
*/
def bool(n: Long): Codec[Boolean] = new Codec[Boolean] {
private val zeros = BitVector.low(n)
private val ones = BitVector.high(n)
private val codec = bits(n).xmap[Boolean](bits => !(bits == zeros), b => if b then ones else zeros)
def sizeBound = SizeBound.exact(n)
def encode(b: Boolean) = codec.encode(b)
def decode(b: BitVector) = codec.decode(b)
override def toString = s"bool($n)"
}
/**
* String codec that uses the supplied `Charset` to perform encoding/decoding.
*
* This codec does not encode the size of the string in to the output. Hence, decoding
* a vector that has additional data after the encoded string will result in
* unexpected output. Instead, it is common to use this codec along with either
* [[fixedSizeBits]] or [[variableSizeBits]]. For example, a common encoding
* is a size field, say 2 bytes, followed by the encoded string. This can be
* accomplished with: {{{variableSizeBits(uint16, string)}}}
*
* @param charset charset to use to convert strings to/from binary
*/
def string(charset: Charset): Codec[String] = new StringCodec(charset)
/**
* String codec that uses the `US-ASCII` charset. See [[string]] for more information on `String` codecs.
*/
val ascii = string(Platform.ascii)
/**
* String codec that uses the `UTF-8` charset. See [[string]] for more information on `String` codecs.
*/
val utf8 = string(Platform.utf8)
/**
* String codec that uses the `US-ASCII` charset that encodes strings with a trailing `NUL` termination byte
* and decodes a string up to the next `NUL` termination byte.
* It fails to decode if the bit vector ends before a `NUL` termination byte can be found.
*/
val cstring: Codec[String] = filtered(
ascii,
new Codec[BitVector] {
val nul = BitVector.lowByte
override def sizeBound: SizeBound = SizeBound.unknown
override def encode(bits: BitVector): Attempt[BitVector] = Attempt.successful(bits ++ nul)
override def decode(bits: BitVector): Attempt[DecodeResult[BitVector]] =
bits.bytes.indexOfSlice(nul.bytes) match {
case -1 => Attempt.failure(Err("Does not contain a 'NUL' termination byte."))
case i => Attempt.successful(DecodeResult(bits.take(i * 8L), bits.drop(i * 8L + 8L)))
}
}
).withToString("cstring")
/**
* String codec that uses the given `Charset` and prefixes the encoded string by the byte size
* in a 32-bit 2s complement big endian field.
*
* @param charset charset to use to convert strings to/from binary
*/
def string32(charset: Charset): Codec[String] =
variableSizeBytes(int32, string(charset)).withToString(s"string32(${charset.displayName})")
/**
* String codec that uses the given `Charset` and prefixes the encoded string by the byte size
* in a 32-bit 2s complement little endian field.
*
* @param charset charset to use to convert strings to/from binary
*/
def string32L(charset: Charset): Codec[String] =
variableSizeBytes(int32L, string(charset)).withToString(s"string32(${charset.displayName})")
/**
* String codec that uses the `US-ASCII` charset and prefixes the encoded string by the byte size
* in a 32-bit 2s complement big endian field.
*/
val ascii32 = string32(Platform.ascii)
/**
* String codec that uses the `US-ASCII` charset and prefixes the encoded string by the byte size
* in a 32-bit 2s complement little endian field.
*/
val ascii32L = string32L(Platform.ascii)
/**
* String codec that uses the `UTF-8` charset and prefixes the encoded string by the byte size
* in a 32-bit 2s complement big endian field.
*/
val utf8_32 = string32(Platform.utf8)
/**
* String codec that uses the `UTF-8` charset and prefixes the encoded string by the byte size
* in a 32-bit 2s complement little endian field.
*/
val utf8_32L = string32L(Platform.utf8)
/**
* Encodes/decodes `UUID`s as 2 64-bit big-endian longs, first the high 64-bits then the low 64-bits.
*/
val uuid: Codec[UUID] = UuidCodec
/**
* Codec that always returns an empty vector from `encode` and always returns `(empty, value)` from `decode`.
* This is often useful when combined with other codecs (e.g., the [[discriminated]]).
* @param value value to return from decode
*/
def provide[A](value: A): Codec[A] = new ProvideCodec(value)
/**
* Codec that always encodes `size` 0 bits and always decodes `size` bits and then discards them, returning `()` instead.
* @param size number of bits to ignore
*/
def ignore(size: Long): Codec[Unit] = new IgnoreCodec(size)
/**
* Codec that always encodes the specified bits and always decodes the specified bits, returning `()` if the actual bits match
* the specified bits and returning an error otherwise.
* @param bits constant bits
*/
def constant(bits: BitVector): Codec[Unit] = new ConstantCodec(bits)
/**
* Codec that always encodes the specified bytes and always decodes the specified bytes, returning `()` if the actual bytes match
* the specified bytes and returning an error otherwise.
* @param bytes constant bytes
*/
def constant(bytes: ByteVector): Codec[Unit] = constant(bytes.bits)
/**
* Codec that always encodes the specified bits and always decodes the specified bits, returning `()` if the actual bits match
* the specified bits and returning an error otherwise.
* @param bits constant bits
*/
def constant[A: Integral](bits: A*): Codec[Unit] = constant(BitVector(bits*))
/**
* Codec that always encodes the specified bits and always decodes n bits, returning `()`, where n is the length of the
* specified bits.
* @param bits constant bits
*/
def constantLenient(bits: BitVector): Codec[Unit] = new ConstantCodec(bits, false)
/**
* Codec that always encodes the specified bytes and always decodes n bytes, returning `()`, where n is the length of the
* specified bytes.
* @param bytes constant bytes
*/
def constantLenient(bytes: ByteVector): Codec[Unit] = constantLenient(bytes.bits)
/**
* Codec that always encodes the specified bits and always decodes n bits, returning `()`, where n is the length of the
* specified bits.
* @param bits constant bits
*/
def constantLenient[A: Integral](bits: A*): Codec[Unit] = constantLenient(BitVector(bits*))
/**
* Codec that limits the number of bits the specified codec works with.
*
* When encoding, if encoding with the specified codec
* results in less than the specified size, the vector is right padded with 0 bits. If the result is larger than the specified
* size, an encoding error is returned.
*
* When decoding, the specified codec is only given `size` bits. If the specified codec does not consume all the bits it was
* given, any remaining bits are discarded.
*
* @param size number of bits
* @param codec codec to limit
*/
def fixedSizeBits[A](size: Long, codec: Codec[A]): Codec[A] = new FixedSizeCodec(size, codec)
/**
* Byte equivalent of [[fixedSizeBits]].
* @param size number of bytes
* @param codec codec to limit
*/
def fixedSizeBytes[A](size: Long, codec: Codec[A]): Codec[A] = new Codec[A] {
private val fcodec = fixedSizeBits(size * 8, codec)
def sizeBound = fcodec.sizeBound
def encode(a: A) = fcodec.encode(a)
def decode(b: BitVector) = fcodec.decode(b)
override def toString = s"fixedSizeBytes($size, $codec)"
}
/**
* Codec that limits the number of bits the specified codec works with.
*
* If the encoded result is larger than the specified
* size, an encoding error is returned.
*
* If encoding with the specified codec
* results in less than the specified size, the vector is right padded by repeatedly encoding with padCodec.
* An encoding error is returned if the padCodec result does not precisely fill the remaining space.
*
* When decoding, the specified codec is only given `size` bits. If the specified codec does not consume all the bits it was
* given, all remaining bits are repeatedly decoded by padCodec. A decoding error is returned if any
* padCodec decode returns an error.
*
* @param size number of bits
* @param codec codec to limit
* @param padCodec codec to use for padding
*/
def paddedFixedSizeBits[A](size: Long, codec: Codec[A], padCodec: Codec[Unit]): Codec[A] =
new PaddedFixedSizeCodec(size, codec, _ => padCodec)
/**
* Codec that limits the number of bits the specified codec works with.
*
* If the encoded result is larger than the specified
* size, an encoding error is returned.
*
* If encoding with the specified codec
* results in less than the specified size, the vector is right padded by repeatedly encoding with the
* codec returned from `padCodec(numberOfPaddingBits)`.
* An encoding error is returned if the padCodec result does not precisely fill the remaining space.
*
* When decoding, the specified codec is only given `size` bits. If the specified codec does not consume all the bits it was
* given, all remaining bits are repeatedly decoded by the codec returned from `padCodec(remainingBitCount)`.
* A decoding error is returned if any padding decode iteration returns an error.
*
* @param size number of bits
* @param codec codec to limit
* @param padCodec function that provides the codec to use for padding
*/
def paddedFixedSizeBitsDependent[A](
size: Long,
codec: Codec[A],
padCodec: Long => Codec[Unit]
): Codec[A] = new PaddedFixedSizeCodec(size, codec, padCodec)
/**
* Byte equivalent of [[paddedFixedSizeBits]].
* @param size number of bytes
* @param codec codec to limit
* @param padCodec codec to use for padding
*/
def paddedFixedSizeBytes[A](size: Long, codec: Codec[A], padCodec: Codec[Unit]): Codec[A] =
paddedFixedSizeBytesDependent(size, codec, _ => padCodec)
/**
* Byte equivalent of [[paddedFixedSizeBitsDependent]].
*
* The `padCodec` function is passed the number of *bits* of padding required -- not bytes.
*
* @param size number of bytes
* @param codec codec to limit
* @param padCodec function that provides the codec to use for padding
*/
def paddedFixedSizeBytesDependent[A](
size: Long,
codec: Codec[A],
padCodec: Long => Codec[Unit]
): Codec[A] = new Codec[A] {
private val fcodec = paddedFixedSizeBitsDependent(size * 8, codec, padCodec)
def sizeBound = SizeBound.exact(size * 8)
def encode(a: A) = fcodec.encode(a)
def decode(b: BitVector) = fcodec.decode(b)
override def toString = s"paddedFixedSizeBytes($size, $codec)"
}
/**
* Codec that pads on a multiplier.
*
* Similar to ByteAligendCodec, but instead of only padding to 8 bits, pads to a variable size
*
* @param sizeCodec codec that determines the size
* @param valueCodec codec for encoding the payload
* @param multipleForPadding multiple to align the value to with padding
*/
def paddedVarAlignedBits[A](
sizeCodec: Codec[Long],
valueCodec: Codec[A],
multipleForPadding: Int
) = new PaddedVarAlignedCodec(sizeCodec, valueCodec, multipleForPadding.toLong)
/**
* Byte equivalent of [[paddedVarAlignedBits]].
* @param sizeCodec codec that determines the size
* @param valueCodec coec for encoding the payload
* @param multipleForPadding multiple of bytes to align the value to with padding
*/
def paddedVarAlignedBytes[A](
sizeCodec: Codec[Int],
valueCodec: Codec[A],
multipleForPadding: Int
) = new Codec[A] {
val sizedWiden = widenIntToLong(sizeCodec)
private val codec = new PaddedVarAlignedCodec(
sizedWiden.widen(_ * 8, bitsToBytesDivisible),
valueCodec,
multipleForPadding.toLong * 8
)
override def encode(a: A) = codec.encode(a)
override def decode(buffer: BitVector) = codec.decode(buffer)
override def sizeBound = codec.sizeBound
override def toString = "PaddedVarAlignedBytesCodec"
}
/**
* Codec that limits the number of bits the specified codec works with.
*
* When encoding, if encoding with the specified codec
* results in less than the specified size, the vector is returned with no padding. If the result is larger than the specified
* size, an encoding error is returned. This differs from `fixedSizeBits` by not padding encoded vectors less than the specified
* size.
*
* When decoding, the specified codec is only given `size` bits. If the specified codec does not consume all the bits it was
* given, any remaining bits are returned with the overall remainder.
*
* @param size number of bits
* @param codec codec to limit
*/
def limitedSizeBits[A](limit: Long, codec: Codec[A]): Codec[A] =
new LimitedSizeCodec(limit, codec)
/**
* Byte equivalent of [[limitedSizeBits]].
* @param size number of bytes
* @param codec codec to limit
*/
def limitedSizeBytes[A](limit: Long, codec: Codec[A]): Codec[A] = new Codec[A] {
private val fcodec = limitedSizeBits(limit * 8, codec)
def sizeBound = fcodec.sizeBound
def encode(a: A) = fcodec.encode(a)
def decode(b: BitVector) = fcodec.decode(b)
override def toString = s"limitedSizeBytes($limit, $codec)"
}
/**
* Codec that supports vectors of the form `size ++ value` where the `size` field decodes to the bit length of the `value` field.
*
* For example, encoding the string `"hello"` with `variableSizeBits(uint8, ascii)` yields a vector of 6 bytes -- the first byte being
* 0x28 and the next 5 bytes being the US-ASCII encoding of `"hello"`.
*
* The `size` field can be any `Int` codec. An optional padding can be applied to the size field. The `sizePadding` is added to
* the calculated size before encoding, and subtracted from the decoded size before decoding the value.
*
* For example, encoding `"hello"` with `variableSizeBits(uint8, ascii, 1)` yields a vector of 6 bytes -- the first byte being
* 0x29 and the next 5 bytes being the US-ASCII encoding of `"hello"`.
*
* @param size codec that encodes/decodes the size in bits
* @param value codec the encodes/decodes the value
* @param sizePadding number of bits to add to the size before encoding (and subtract from the size before decoding)
*/
def variableSizeBits[A](size: Codec[Int], value: Codec[A], sizePadding: Int = 0): Codec[A] =
variableSizeBitsLong(widenIntToLong(size), value, sizePadding.toLong)
/**
* Byte equivalent of [[variableSizeBits]].
* @param size codec that encodes/decodes the size in bytes
* @param value codec the encodes/decodes the value
* @param sizePadding number of bytes to add to the size before encoding (and subtract from the size before decoding)
*/
def variableSizeBytes[A](size: Codec[Int], value: Codec[A], sizePadding: Int = 0): Codec[A] =
variableSizeBytesLong(widenIntToLong(size), value, sizePadding.toLong)
private def widenIntToLong(c: Codec[Int]): Codec[Long] =
c.widen(
i => i.toLong,
l =>
if l > Int.MaxValue || l < Int.MinValue then
Attempt.failure(Err(s"$l cannot be converted to an integer"))
else Attempt.successful(l.toInt)
)
.withToString(c.toString)
/**
* Codec that supports vectors of the form `size ++ value` where the `size` field decodes to the bit length of the `value` field.
*
* For example, encoding the string `"hello"` with `variableSizeBitsLong(uint32, ascii)` yields a vector of 9 bytes -- the first four bytes being
* 0x00000028 and the next 5 bytes being the US-ASCII encoding of `"hello"`.
*
* The `size` field can be any `Long` codec. An optional padding can be applied to the size field. The `sizePadding` is added to
* the calculated size before encoding, and subtracted from the decoded size before decoding the value.
*
* For example, encoding `"hello"` with `variableSizeBitsLong(uint32, ascii, 1)` yields a vector of 9 bytes -- the first 4 bytes being
* 0x00000029 and the next 5 bytes being the US-ASCII encoding of `"hello"`.
*
* @param size codec that encodes/decodes the size in bits
* @param value codec the encodes/decodes the value
* @param sizePadding number of bits to add to the size before encoding (and subtract from the size before decoding)
*/
def variableSizeBitsLong[A](size: Codec[Long], value: Codec[A], sizePadding: Long = 0): Codec[A] =
new VariableSizeCodec(size, value, sizePadding)
/**
* Byte equivalent of [[variableSizeBitsLong]].
* @param size codec that encodes/decodes the size in bytes
* @param value codec the encodes/decodes the value
* @param sizePadding number of bytes to add to the size before encoding (and subtract from the size before decoding)
*/
def variableSizeBytesLong[A](
size: Codec[Long],
value: Codec[A],
sizePadding: Long = 0
): Codec[A] = new Codec[A] {
private val codec =
variableSizeBitsLong(size.widen(_ * 8, bitsToBytesDivisible), value, sizePadding * 8)
def sizeBound = size.sizeBound + value.sizeBound
def encode(a: A) = codec.encode(a)
def decode(b: BitVector) = codec.decode(b)
override def toString = s"variableSizeBytes($size, $value)"
}
private def bitsToBytesDivisible(n: Long): Attempt[Long] =
if n % 8 == 0 then Attempt.successful(n / 8)
else Attempt.failure(Err(s"$n is not evenly divisible by 8"))
/**
* Codec that supports vectors of the form `value ++ delimiter` where the `delimiter` marks the end of the `value` field.
*
* @param size codec that encodes/decodes the delimiter
* @param value codec the encodes/decodes the value
*/
def variableSizeDelimited[A](delimiterCodec: Codec[Unit], value: Codec[A]): Codec[A] =
new VariableSizeDelimitedCodec(delimiterCodec, value)
/**
* Codec that supports vectors of the form `value ++ delimiter` where the `delimiter` marks the end of the `value` field.
*
* @param size codec that encodes/decodes the delimiter
* @param value codec the encodes/decodes the value
* @param multipleValueSize the size or a mutiple size of the expected value
*/
def variableSizeDelimited[A](
delimiterCodec: Codec[Unit],
value: Codec[A],
multipleValueSize: Long
): Codec[A] =
new VariableSizeDelimitedCodec(delimiterCodec, value, multipleValueSize)
/**
* Codec that supports vectors of the form `size ++ prefix ++ value` where the `size` field decodes to the bit length of the `value` field.
*
* For example, encoding `(3, "hello")` with `variableSizePrefixedBits(uint8, int32, ascii)` yields a vector of 10 bytes -- the first byte being
* 0x28, the next 4 bytes being 0x00000003, and the last 5 bytes being the US-ASCII encoding of `"hello"`.
*
* The `size` field can be any `Int` codec. An optional padding can be applied to the size field. The `sizePadding` is added to
* the calculated size before encoding, and subtracted from the decoded size before decoding the value.
*
* For example, encoding `(3, "hello")` with `variableSizePrefixedBits(uint8, int32, ascii, 1)` yields a vector of 10 bytes -- the first byte being
* 0x29, the next 4 bytes being 0x00000003, and the last 5 bytes being the US-ASCII encoding of `"hello"`.
*
* @param size codec that encodes/decodes the size in bits
* @param prefix codec that encodes/decodes the prefix
* @param value codec the encodes/decodes the value
* @param sizePadding number of bits to add to the size before encoding (and subtract from the size before decoding)
*/
def variableSizePrefixedBits[A, B](
size: Codec[Int],
prefix: Codec[A],
value: Codec[B],
sizePadding: Int = 0
): Codec[(A, B)] =
variableSizePrefixedBitsLong(widenIntToLong(size), prefix, value, sizePadding.toLong)
/**
* Byte equivalent of [[variableSizePrefixedBits]].
* @param size codec that encodes/decodes the size in bytes
* @param prefix codec that encodes/decodes the prefix
* @param value codec the encodes/decodes the value
* @param sizePadding number of bytes to add to the size before encoding (and subtract from the size before decoding)
*/
def variableSizePrefixedBytes[A, B](
size: Codec[Int],
prefix: Codec[A],
value: Codec[B],
sizePadding: Int = 0
): Codec[(A, B)] =
variableSizePrefixedBytesLong(widenIntToLong(size), prefix, value, sizePadding.toLong)
/**
* Codec that supports vectors of the form `size ++ prefix ++ value` where the `size` field decodes to the bit length of the `value` field.
*
* For example, encoding the string `(3, "hello")` with `variableSizePrefixedBitsLong(uint32, int32, ascii)` yields a vector of 13 bytes -- the
* first four bytes being 0x00000028, the next 4 bytes being 0x00000003, and the last 5 bytes being the US-ASCII encoding of `"hello"`.
*
* The `size` field can be any `Long` codec. An optional padding can be applied to the size field. The `sizePadding` is added to
* the calculated size before encoding, and subtracted from the decoded size before decoding the value.
*
* For example, encoding `(3, "hello")` with `variableSizePrefixedBitsLong(uint32, int32, ascii, 1)` yields a vector of 13 bytes -- the first
* 4 bytes being 0x00000029, the next 4 bytes being 0x00000003, and the last 5 bytes being the US-ASCII encoding of `"hello"`.
*
* @param size codec that encodes/decodes the size in bits
* @param prefix codec that encodes/decodes the prefix
* @param value codec the encodes/decodes the value
* @param sizePadding number of bits to add to the size before encoding (and subtract from the size before decoding)
*/
def variableSizePrefixedBitsLong[A, B](
size: Codec[Long],
prefix: Codec[A],
value: Codec[B],
sizePadding: Long = 0
): Codec[(A, B)] =
new VariableSizePrefixedCodec(size, prefix, value, sizePadding)
/**
* Byte equivalent of [[variableSizePrefixedBitsLong]].
* @param size codec that encodes/decodes the size in bytes
* @param prefix codec that encodes/decodes the prefix
* @param value codec the encodes/decodes the value
* @param sizePadding number of bytes to add to the size before encoding (and subtract from the size before decoding)
*/
def variableSizePrefixedBytesLong[A, B](
size: Codec[Long],
prefix: Codec[A],
value: Codec[B],
sizePadding: Long = 0
): Codec[(A, B)] = new Codec[(A, B)] {
private val codec = variableSizePrefixedBitsLong(
size.widen(_ * 8, bitsToBytesDivisible),
prefix,
value,
sizePadding * 8
)
def sizeBound = size.sizeBound + value.sizeBound
def encode(ab: (A, B)) = codec.encode(ab)
def decode(b: BitVector) = codec.decode(b)
override def toString = s"variableSizePrefixedBytes($size, $prefix, $value)"
}
/**
* Decodes using the specified codec but resets the remainder to the original vector.
* Encodes with the specified codec.
* @param target codec that encodes/decodes the value
* @return codec that behaves the same as `target` but resets remainder to the input vector after decoding
*/
def peek[A](target: Codec[A]): Codec[A] = new Codec[A] {
def sizeBound = target.sizeBound
def encode(a: A) = target.encode(a)
def decode(b: BitVector) = target.decode(b).map(_.mapRemainder(_ => b))
}
/**
* Codec that decodes vectors of the form `size ++ rest` as a `BitVector`, where the returned vector includes the size bits.
*
* This differs from `variableSizeBits(size, bits, sizePadding)` in that the encoded size is expected to be encoded before
* calling encode and the encoded size is returned as part of the vector.
*
* @param size size codec -- must have an exact size
* @param sizePadding number of bits to subtract from the size before decoding
*/
def peekVariableSizeBits(size: Codec[Int], sizePadding: Int = 0): Codec[BitVector] =
peekVariableSizeBitsLong(widenIntToLong(size), sizePadding.toLong)
/**
* `Long` equivalent of [[peekVariableSizeBits]].
* @param size size codec -- must have an exact size
* @param sizePadding number of bits to subtract from the size before decoding
*/
def peekVariableSizeBitsLong(size: Codec[Long], sizePadding: Long = 0L): Codec[BitVector] =
new Codec[BitVector] {
private val sizeInBits = size.sizeBound.exact.getOrElse(
throw new IllegalArgumentException(
s"must be used with a size field of an exactly known size but $size has size bound ${size.sizeBound}"
)
)
private val decoder =
(peek(bits(sizeInBits)) :: variableSizeBitsLong(size, bits, sizePadding)).map(_ ++ _)
def sizeBound = size.sizeBound.atLeast
def encode(b: BitVector) = Attempt.successful(b)
def decode(b: BitVector) = decoder.decode(b)
override def toString = s"peekVariableSizeBits($size)"
}
/**
* Equivalent to [[peekVariableSizeBits]] where the size units are in bytes instead of bits.
*
* @param size size codec -- must have an exact size
* @param sizePadding number of bytes to subtract from the size before decoding
*/
def peekVariableSizeBytes(size: Codec[Int], sizePadding: Int = 0): Codec[BitVector] =
peekVariableSizeBytesLong(widenIntToLong(size), sizePadding.toLong)
/**
* `Long` equivalent of [[peekVariableSizeBytes]].
* @param size size codec -- must have an exact size
* @param sizePadding number of bits to subtract from the size before decoding
*/
def peekVariableSizeBytesLong(size: Codec[Long], sizePadding: Long = 0L): Codec[BitVector] =
new Codec[BitVector] {
private val codec =
peekVariableSizeBitsLong(size.widen(_ * 8, bitsToBytesDivisible), sizePadding * 8)
def sizeBound = codec.sizeBound
def encode(a: BitVector) = codec.encode(a)
def decode(b: BitVector) = codec.decode(b)
override def toString = s"peekVariableSizeBytes($size)"
}
/**
* Codec that:
* - encodes using the specified codec but right-pads with 0 bits to the next largest byte when the size of the
* encoded bit vector is not divisible by 8
* - decodes using the specified codec but drops any leading bits of the remainder when the number of bytes
* consumed by the specified codec is not divisible by 8
*
* This combinator allows byte alignment without manually specifying ignore bits. For example, instead of writing
* `(bool(1) :: bool(1) :: ignore(6)).dropUnits`, this combinator allows `byteAligned(bool(1) :: bool(1))`.
*
* Note that aligning large structures on byte boundaries can provide significant performance improvements when
* converting to/from data structures that are based on bytes -- e.g., `Array[Byte]` or `ByteBuffer`.
*
* @param codec codec to align to next larger byte boundary
*/
def byteAligned[A](codec: Codec[A]): Codec[A] = new ByteAlignedCodec(codec)
/**
* Codec of `Option[A]` that delegates to a `Codec[A]` when the `included` parameter is true.
*
* When encoding, if `included` is true and the value to encode is a `Some`, the specified codec is used to encode the inner value.
* Otherwise, an empty bit vector is returned.
*
* When decoding, if `included` is true, the specified codec is used and its result is wrapped in a `Some`. Otherwise, a `None` is returned.
*
* @param included whether this codec is enabled (meaning it delegates to the specified codec) or disabled, in which case it
* encodes no bits and returns `None` from decode
* @param codec codec to conditionally include
*/
def conditional[A](included: Boolean, codec: => Codec[A]): Codec[Option[A]] =
new ConditionalCodec(included, codec)
/**
* Codec of `Option[A]` that delegates to a `Codec[A]` when the `guard` codec decodes a true.
*
* When encoding, a `Some` results in `guard` encoding a `true` and `target` encoding the value.
* A `None` results in `guard` encoding a false and the `target` not encoding anything.
*
* Various guard codecs and combinators are provided by this library -- e.g., `bitsRemaining` and `recover`.
*
* @param guard codec that determines whether the target codec is included
* @param target codec to conditionally include
*/
def optional[A](guard: Codec[Boolean], target: Codec[A]): Codec[Option[A]] =
either(guard, provide(()), target)
.xmap[Option[A]](_.toOption, _.toRight(()))
.withToString(s"optional($guard, $target)")
/**
* Codec that decodes true when the input vector is non-empty and false when it is empty.
* Encodes to an empty bit vector.
*
*/
val bitsRemaining: Codec[Boolean] = new Codec[Boolean] {
def sizeBound = SizeBound.exact(0)
def encode(b: Boolean) = Attempt.successful(BitVector.empty)
def decode(b: BitVector) = Attempt.successful(DecodeResult(b.nonEmpty, b))
override def toString = "bitsRemaining"
}
/**
* Creates a `Codec[A]` from a `Codec[Option[A]]` and a fallback `Codec[A]`.
*
* When encoding, the `A` is encoded with `opt` (by wrapping it in a `Some`).
* When decoding, `opt` is first used to decode the buffer. If it decodes a `Some(a)`, that
* value is returned. If it decodes a `None`, `default` is used to decode the buffer.
*
* @param opt optional codec
* @param default fallback codec used during decoding when `opt` decodes a `None`
*/
def withDefault[A](opt: Codec[Option[A]], default: Codec[A]): Codec[A] =
val paired = opt.flatZip {
case Some(a) => provide(a)
case None => default
}
paired.xmap[A](_._2, a => (Some(a), a)).withToString(s"withDefault($opt, $default)")
/**
* Creates a `Codec[A]` from a `Codec[Option[A]]` and a fallback value `A`.
*
* When encoding, the `A` is encoded with `opt` (by wrapping it in a `Some`).
* When decoding, `opt` is first used to decode the buffer. If it decodes a `Some(a)`, that
* value is returned. If it decodes a `None`, the `default` value is return.
*
* @param opt optional codec
* @param default fallback value returned from `decode` when `opt` decodes a `None`
*/
def withDefaultValue[A](opt: Codec[Option[A]], default: A): Codec[A] =
withDefault(opt, provide(default))
/**
* Creates a codec that decodes true when the target codec decodes successfully and decodes false
* when the target codec decodes unsuccessfully. Upon a successful decode of the target codec, the
* remaining bits are returned, whereas upon an unsuccessful decode, the original input buffer is
* returned.
*
* When encoding, a true results in the target codec encoding a unit whereas a false results
* in encoding of an empty vector.
*
* @param target codec to recover errors from
*/
def recover(target: Codec[Unit]): Codec[Boolean] = new RecoverCodec(target, false)
/**
* Lookahead version of [[recover]] -- i.e., upon successful decoding with the target codec,
* the original buffer is returned instead of the remaining buffer.
*
* @param target codec to recover errors from
*/
def lookahead(target: Codec[Unit]): Codec[Boolean] = new RecoverCodec(target, true)
/**
* Codec that encodes/decodes using the specified codecs by trying each codec in succession
* and using the first successful result.
*
*/
def choice[A](codecs: Codec[A]*): Codec[A] =
Codec(
Encoder.choiceEncoder(codecs*),
Decoder.choiceDecoder(codecs*)
).withToString(codecs.mkString("choice(", ", ", ")"))
/**
* Codec that encodes/decodes a `Vector[A]` from a `Codec[A]`.
*
* When encoding, each `A` in the vector is encoded and all of the resulting vectors are concatenated.
*
* When decoding, `codec.decode` is called repeatedly until there are no more remaining bits and the value result
* of each `decode` is returned in the vector.
*
* @param codec codec to encode/decode a single element of the sequence
*/
def vector[A](codec: Codec[A]): Codec[Vector[A]] = new VectorCodec(codec)
/**
* Codec that encodes/decodes a `Vector[A]` of `N` elements using a `Codec[A]`.
*
* When encoding, the number of elements in the vector is encoded using `countCodec`
* and the values are then each encoded using `valueCodec`.
*
* When decoding, the number of elements is decoded using `countCodec` and then that number of elements
* are decoded using `valueCodec`. Any remaining bits are returned.
*
* Note: when the count is known statically, use `vectorOfN(provide(count), ...)`.
*
* @param codec codec to encode/decode a single element of the sequence
*/
def vectorOfN[A](countCodec: Codec[Int], valueCodec: Codec[A]): Codec[Vector[A]] =
countCodec
.flatZip(count => new VectorCodec(valueCodec, Some(count)))
.narrow(
{
case (cnt, xs) =>
if xs.size == cnt then Attempt.successful(xs)
else {
val valueBits = valueCodec.sizeBound.exact.getOrElse(valueCodec.sizeBound.lowerBound)
Attempt.failure(Err.insufficientBits(cnt * valueBits, xs.size * valueBits))
}
},
xs => (xs.size, xs)
)
.withToString(s"vectorOfN($countCodec, $valueCodec)")
/**
* Codec that encodes/decodes a `Vector[A]` from a `Codec[A]`.
*
* When encoding, each `A` in the vector is encoded and all of the resulting bits are combined using `mux`.
*
* When decoding, `deMux` is called repeatedly to obtain the next bits (to decode using `valueCodec`) and the
* remaining bits (input to `deMux` on next iteration) until a decoding error is encountered or no more bits remain.
* The final return value is a vector of all decoded element values.
*
* Note: For large vectors, it may be necessary to compact bits in `deMux`.
*
* @param mux element multiplexer
* @param deMux element de-multiplexer (should return the next bits to decode and the remaining bits for next iteration)
* @param valueCodec element codec (used to decode next bits)
* @tparam A element type
*/
def vectorMultiplexed[A](
mux: (BitVector, BitVector) => BitVector,
deMux: BitVector => (BitVector, BitVector),
valueCodec: Codec[A]
): Codec[Vector[A]] =
new VectorMultiplexedCodec[A](mux, deMux, valueCodec)
/**
* Codec that encodes/decodes a `Vector[A]` from a `Codec[A]`.
*
* When encoding, each `A` in the vector is encoded and all of the resulting bits are concatenated using `delimiter`.
*
* When decoding, the input bits are first (logically) grouped into `delimiter` sized chunks and partitioned around `delimiter` chunks.
* Then, the individual partitions are (concatenated and) decoded using the `valueCodec` and the values collected are returned in a vector.
*
* Note: This method applies specific semantics to the notion of a `delimiter`. An alternate (and faster) implementation could be to search
* for the `delimiter` using `BitVector.indexOfSlice` but this would work only if value bits do not contain the `delimiter` bits at
* any bit position.
*
* Example:
* {{{
* val codec = vectorDelimited(BitVector(' '), ascii)
* codec.decode(ascii.encode("i am delimited").require).require.value // Vector("i", "am", "delimited")
* }}}
*
* @param delimiter the bits used to separate element bit values
* @param valueCodec element codec (used to decode next bits)
* @tparam A element type
*/
def vectorDelimited[A](delimiter: BitVector, valueCodec: Codec[A]): Codec[Vector[A]] =
if delimiter.size == 0 then vector(valueCodec)
else
vectorMultiplexed(
_ ++ delimiter ++ _,
bits => DeMultiplexer.delimited(bits, delimiter),
valueCodec
).withToString(s"vectorDelimited($delimiter, $valueCodec)")
/**
* Codec that encodes/decodes a `List[A]` from a `Codec[A]`.
*
* When encoding, each `A` in the list is encoded and all of the resulting vectors are concatenated.
*
* When decoding, `codec.decode` is called repeatedly until there are no more remaining bits and the value result
* of each `decode` is returned in the list.
*
* @param codec codec to encode/decode a single element of the sequence
*/
def list[A](codec: Codec[A]): Codec[List[A]] = new ListCodec(codec)
/**
* Codec that encodes/decodes a `List[A]` of `N` elements using a `Codec[A]`.
*
* When encoding, the number of elements in the list is encoded using `countCodec`
* and the values are then each encoded using `valueCodec`.
*
* When decoding, the number of elements is decoded using `countCodec` and then that number of elements
* are decoded using `valueCodec`. Any remaining bits are returned.
*
* Note: when the count is known statically, use `listOfN(provide(count), ...)`.
*
* @param codec codec to encode/decode a single element of the sequence
*/
def listOfN[A](countCodec: Codec[Int], valueCodec: Codec[A]): Codec[List[A]] =
countCodec
.flatZip(count => new ListCodec(valueCodec, Some(count)))
.narrow(
{
case (cnt, xs) =>
if xs.size == cnt then Attempt.successful(xs)
else {
val valueBits = valueCodec.sizeBound.exact.getOrElse(valueCodec.sizeBound.lowerBound)
Attempt.failure(Err.insufficientBits(cnt * valueBits, xs.size * valueBits))
}
},
xs => (xs.size, xs)
)
.withToString(s"listOfN($countCodec, $valueCodec)")
/**
* Codec that encodes/decodes a `List[A]` from a `Codec[A]`.
*
* When encoding, each `A` in the list is encoded and all of the resulting bits are combined using `mux`.
*
* When decoding, `deMux` is called repeatedly to obtain the next bits (to decode using `valueCodec`) and the
* remaining bits (input to `deMux` on next iteration) until a decoding error is encountered or no more bits remain.
* The final return value is a list of all decoded element values.
*
* Note: For large lists, it may be necessary to compact bits in `deMux`.
*
* @param mux element multiplexer
* @param deMux element de-multiplexer (should return the next bits to decode and the remaining bits for next iteration)
* @param valueCodec element codec (used to decode next bits)
* @tparam A element type
*/
def listMultiplexed[A](
mux: (BitVector, BitVector) => BitVector,
deMux: BitVector => (BitVector, BitVector),
valueCodec: Codec[A]
): Codec[List[A]] =
new ListMultiplexedCodec[A](mux, deMux, valueCodec)
/**
* Codec that encodes/decodes a `List[A]` from a `Codec[A]`.
*
* When encoding, each `A` in the list is encoded and all of the resulting bits are concatenated using `delimiter`.
*
* When decoding, the input bits are first (logically) grouped into `delimiter` sized chunks and partitioned around `delimiter` chunks.
* Then, the individual partitions are (concatenated and) decoded using the `valueCodec` and the values collected are returned in a list.
*
* Note: This method applies specific semantics to the notion of a `delimiter`. An alternate (and faster) implementation could be to search
* for the `delimiter` using `BitVector.indexOfSlice` but this would work only if value bits do not contain the `delimiter` bits at
* any bit position.
*
* Example:
* {{{
* val codec = listDelimited(BitVector(' '), ascii)
* codec.decode(ascii.encode("i am delimited").require).require.value // List("i", "am", "delimited")
* }}}
*
* @param delimiter the bits used to separate element bit values
* @param valueCodec element codec (used to decode next bits)
* @tparam A element type
*/
def listDelimited[A](delimiter: BitVector, valueCodec: Codec[A]): Codec[List[A]] =
if delimiter.size == 0 then list(valueCodec)
else
listMultiplexed(
_ ++ delimiter ++ _,
bits => DeMultiplexer.delimited(bits, delimiter),
valueCodec
).withToString(s"listDelimited($delimiter, $valueCodec)")
/**
* Combinator that chooses amongst two codecs based on a given byte ordering.
* @param big codec to use when big endian
* @param little codec to use when little endian
*/
def endiannessDependent[A](big: Codec[A], little: Codec[A])(
using ordering: ByteOrdering
): Codec[A] =
ordering match
case ByteOrdering.BigEndian => big
case ByteOrdering.LittleEndian => little
/**
* Either codec that supports bit vectors of form `indicator ++ (left or right)` where a
* value of `false` for the indicator indicates it is followed by a left value and a value
* of `true` indicates it is followed by a right value.
*
* @param indicator codec that encodes/decodes false for left and true for right
* @param left codec the encodes a left value
* @param right codec the encodes a right value
*/
def either[L, R](
indicator: Codec[Boolean],
left: Codec[L],
right: Codec[R]
): Codec[Either[L, R]] =
discriminated[Either[L, R]]
.by(indicator)
.caseP(false) { case Left(l) => l }(Left.apply)(left)
.caseP(true) { case Right(r) => r }(Right.apply)(right)
/**
* Either codec that supports bit vectors of form `left or right` where the right codec
* is consulted first when decoding. If the right codec fails to decode, the left codec
* is used.
*
* @param left codec the encodes a left value
* @param right codec the encodes a right value
*/
def fallback[L, R](left: Codec[L], right: Codec[R]): Codec[Either[L, R]] =
new Codec[Either[L, R]] {
def sizeBound = left.sizeBound | right.sizeBound
def encode(e: Either[L, R]) = e.fold(left.encode, right.encode)
def decode(b: BitVector) = right.decode(b).map(_.map(Right(_))).recoverWith {
case _ => left.decode(b).map(_.map(Left(_)))
}
}
/**
* Provides a `Codec[A]` that delegates to a lazily evaluated `Codec[A]`.
*/
def lazily[A](codec: => Codec[A]): Codec[A] = Codec.lazily(codec)
/**
* Codec that always fails encoding and decoding with the specified message.
*/
def fail[A](err: Err): Codec[A] = fail(err, err)
/**
* Codec that always fails encoding and decoding with the specified messages.
*/
def fail[A](encErr: Err, decErr: Err): Codec[A] = new FailCodec[A](encErr, decErr)
/**
* Codec that filters bits before/after decoding/encoding.
*
* Note: the remainder returned from `filter.decode` is appended to the remainder of `codec.decode`.
*
* @param codec the target codec
* @param filter a codec that represents pre/post-processing stages for input/output bits
*/
def filtered[A](codec: Codec[A], filter: Codec[BitVector]): Codec[A] = new Codec[A] {
def sizeBound: SizeBound = filter.sizeBound
def encode(value: A): Attempt[BitVector] = codec.encode(value).flatMap(filter.encode)
def decode(bits: BitVector): Attempt[DecodeResult[A]] =
filter.decode(bits).flatMap(r => codec.decode(r.value).map(_.mapRemainder(_ ++ r.remainder)))
override def toString = s"filtered($codec, $filter)"
}
/**
* Codec that supports a checksum.
*
* When encoding, first the value is encoded using `target`, then a checksum is computed over the result the encoded value using `checksum`,
* and finally, the encoded value and the checksum are converted to a single vector using `framing.encode(value -> chk)`.
*
* When decoding, the input vector is split in to an encoded value, a checksum value, and a remainder using `framing.decode`.
* If `validate` is true, a checksum is computed over the encoded value and compared with the decoded checksum value. If the checksums
* match, the encoded value is decoded with `target` and the result is returned, with its remainder concatenated with the remainder of
* deframing. If the checksums do not match, a `ChecksumMismatch` error is raised.
*
* For example: {{{
val crc32 = scodec.bits.crc(hex"04c11db7".bits, hex"ffffffff".bits, true, true, hex"ffffffff".bits)
// Size of the string is not included in the checksum -- the `framing` codec handles adding the size *after* checksum computation
val c = checksummed(utf8, crc32, variableSizeBytes(int32, bits) ~ bits(32))
// Size of the string is included in the checksum
val d = checksummed(utf8_32, crc32, peekVariableSizeBytes(int32) ~ bits(32))
}}}
*
* @param target codec used for encoding/decoding values of type `A`
* @param checksum computes a checksum of the input
* @param framing codec used to convert the encoded value and computed checksum in to a single vector
*/
def checksummed[A](
target: Codec[A],
checksum: BitVector => BitVector,
framing: Codec[(BitVector, BitVector)],
validate: Boolean = true
): Codec[A] = new Codec[A] {
def sizeBound: SizeBound = target.sizeBound.atLeast
def encode(a: A) =
for
value <- target.encode(a)
result <- framing.encode(value -> checksum(value))
yield result
def decode(bits: BitVector) =
for
r <- framing.decode(bits)
(value, actual) = r.value
result <-
if validate then
val expected = checksum(value)
if expected == actual then target.decode(value)
else Attempt.failure(ChecksumMismatch(value, expected, actual))
else
target.decode(value)
yield result.mapRemainder(_ ++ r.remainder)
override def toString = s"checksummed($target, $framing)"
}
/**
* Codec that encrypts and decrypts using a `javax.crypto.Cipher`.
*
* Encoding a value of type `A` is delegated to the specified codec and the resulting bit vector is encrypted
* with a cipher provided by the given [[CipherFactory]].
*
* Decoding first decrypts all of the remaining bits and then decodes the decrypted bits with the
* specified codec. Successful decoding always returns no remaining bits, even if the specified
* codec does not consume all decrypted bits.
*
* @param codec codec that encodes a value to plaintext bits and decodes plaintext bits to a value
* @param cipherFactory factory to use for encryption/decryption
*/
def encrypted[A](codec: Codec[A], cipherFactory: CipherFactory): Codec[A] =
new CipherCodec(codec, cipherFactory)
/**
* Codec that includes a signature of the encoded bits.
*
* Encoding a value of type `A` is delegated to the specified codec and then a signature of those bits is
* appended using the specified [[SignatureFactory]] to perform signing.
*
* Decoding first decodes using the specified codec and then all of the remaining bits are treated as
* the signature of the decoded bits. The signature is verified and if it fails to verify, an error
* is returned.
*
* Note: because decoding is first delegated to the specified code, care must be taken to ensure
* that codec does not consume the signature bits. For example, if the target codec is an unbounded
* string (e.g., ascii, utf8), decoding an encoded vector will result in the string codec trying to
* decode the signature bits as part of the string.
*
* Use [[SignatureFactory]] or [[ChecksumFactory]] to create a [[SignerFactory]].
*
* @param size size in bytes of signature
* @param codec codec to use to encode/decode value field
* @param signatureFactory factory to use for signing/verifying
*/
def fixedSizeSignature[A](
size: Int
)(codec: Codec[A], signerFactory: SignerFactory): Codec[A] =
new SignatureCodec(codec, fixedSizeBytes(size.toLong, bits), signerFactory)
/**
* Codec that includes a signature of the encoded bits.
*
* Same functionality as [[fixedSizeSignature]] with one difference -- the size of the signature bytes are
* written between the encoded bits and the signature bits.
*
* Use [[SignatureFactory]] or [[ChecksumFactory]] to create a [[SignerFactory]].
*
* @param size codec to use to encode/decode size of signature field
* @param codec codec to use to encode/decode value field
* @param signatureFactory factory to use for signing/verifying
*/
def variableSizeSignature[A](
size: Codec[Int]
)(codec: Codec[A], signerFactory: SignerFactory): Codec[A] =
new SignatureCodec(codec, variableSizeBytes(size, bits), signerFactory)
/**
* Codec that encodes/decodes certificates using their default encoding.
*
* @param certType certificate type to pass to `java.security.cert.CertificateFactory.getInstance`
*/
def certificate(certType: String): Codec[Certificate] = new CertificateCodec(certType)
/**
* Codec that encodes/decodes certificates using their default encoding.
*/
def x509Certificate: Codec[X509Certificate] =
certificate("X.509")
.xmap[X509Certificate](_.asInstanceOf[X509Certificate], identity)
.withToString("x509certificate")
/**
* Provides the `|` method on `String`, which is reverse syntax for `codec withContext ctx`.
*
* Usage: {{{val codec = "id" | uint8}}}
*/
extension (context: String) def |[A](codec: Codec[A]): Codec[A] = codec.withContext(context)
// DiscriminatorCodec syntax
/**
* Provides syntax for building a [[DiscriminatorCodec]].
*
* Usage: {{{
val codecA: Codec[A] = ...
val codecB: Codec[B] = ...
val codecE: Codec[Either[A,B]] =
discriminated[Either[A,B]].by(uint8)
.| (0) { case Left(l) => l } (Left.apply) (codecA)
.| (1) { case Right(r) => r } (Right.apply) (codecB)
}}}
* This encodes an `Either[A,B]` by checking the given patterns
* in sequence from top to bottom. For the first pattern that matches,
* it emits the corresponding discriminator value: `0` for `Left`
* and `1` for `Right`, encoded via the `uint8` codec. It then emits
* either an encoded `A`, encoded using `codecA`, or an encoded `B`,
* using `codecB`.
*
* Decoding is the mirror of this; the returned `codecE` will first
* read an `Int`, using the `uint8` codec. If it is a `0`, it then
* runs `codecA`, and injects the result into `Either` via `Left.apply`.
* If it is a `1`, it runs `codecB` and injects the result into `Either`
* via `Right.apply`.
*
* There are a few variations on this syntax. See [[DiscriminatorCodec]] for details.
*/
def discriminated[A]: NeedDiscriminatorCodec[A] = new NeedDiscriminatorCodec[A] {
final def by[B](discriminatorCodec: Codec[B]): DiscriminatorCodec[A, B] =
new DiscriminatorCodec[A, B](discriminatorCodec, Vector(), [x] => (x: Codec[x]) => x)
}
/**
* Provides a codec for an enumerated set of values, where each enumerated value is
* mapped to a tag.
*
* @param discriminatorCodec codec used to encode/decode tag value
* @param mappings mapping from tag values to/from enum values
*/
def mappedEnum[A, B](discriminatorCodec: Codec[B], mappings: (A, B)*): DiscriminatorCodec[A, B] =
mappedEnum(discriminatorCodec, mappings.toMap)
/**
* Provides a codec for an enumerated set of values, where each enumerated value is
* mapped to a tag.
*
* @param discriminatorCodec codec used to encode/decode tag value
* @param map mapping from tag values to/from enum values
*/
def mappedEnum[A, B](discriminatorCodec: Codec[B], map: Map[A, B]): DiscriminatorCodec[A, B] =
map.foldLeft(discriminated[A].by(discriminatorCodec)) {
case (acc, (value, tag)) =>
acc.subcaseO(tag)(a => if a == value then Some(a) else None)(provide(value))
}
/**
* Alternative to [[fallback]] that only falls back to left codec when the right codec fails to decode
* due to an unknown discriminator (i.e., `KnownDiscriminatorType[_]#UnknownDiscriminator`).
*
* @param left codec to use when the right codec fails due to an unknown discriminator error
* @param right codec to use by default when decoding
*/
def discriminatorFallback[L, R](left: Codec[L], right: Codec[R]): Codec[Either[L, R]] =
new Codec[Either[L, R]] {
def sizeBound = left.sizeBound | right.sizeBound
def encode(e: Either[L, R]) = e.fold(left.encode, right.encode)
def decode(b: BitVector) = right.decode(b).map(_.map(Right(_))).recoverWith {
case _: KnownDiscriminatorType[?]#UnknownDiscriminator => left.decode(b).map(_.map(Left(_)))
}
}
/**
* Codec for an `Enumeration` that encodes/decodes using `Enumeration.Value.id` values.
*
* @param discriminator the codec for `Enumeration.Value.id` values
* @param enumeration the target `Enumeration`
* @return
*/
def enumerated(discriminator: Codec[Int], enumeration: Enumeration) =
mappedEnum(
discriminator,
(enumeration.values: Set[enumeration.Value]).map(e => e -> e.id).toMap
) // https://github.com/scala/bug/issues/10906
/**
* Wraps a codec and adds logging of each encoding and decoding operation.
*
* The `logEncode` and `logDecode` functions are called with the result of each encoding and decoding
* operation.
*
* This method is intended to be used to build a domain specific logging combinator. For example: {{{
* def log[A] = logBuilder[A]((a, r) => myLogger.debug(s"..."), (b, r) => myLogger.debug(s"...")) _
* ...
* log(myCodec)
* }}}
*
* For quick logging to standard out, consider using [[logFailuresToStdOut]].
*/
def logBuilder[A](
logEncode: (A, Attempt[BitVector]) => Unit,
logDecode: (BitVector, Attempt[DecodeResult[A]]) => Unit
)(codec: Codec[A]): Codec[A] = new Codec[A] {
override def sizeBound = codec.sizeBound
override def encode(a: A) =
val res = codec.encode(a)
logEncode(a, res)
res
override def decode(b: BitVector) =
val res = codec.decode(b)
logDecode(b, res)
res
override def toString = codec.toString
}
private val constUnit: Any => Unit = _ => ()
/**
* Variant of [[logBuilder]] that only logs successful results.
*/
def logSuccessesBuilder[A](
logEncode: (A, BitVector) => Unit,
logDecode: (BitVector, DecodeResult[A]) => Unit
)(codec: Codec[A]): Codec[A] =
logBuilder[A](
(a, r) => r.fold(constUnit, logEncode(a, _)),
(b, r) => r.fold(constUnit, logDecode(b, _))
)(codec)
/**
* Variant of [[logBuilder]] that only logs failed results.
*/
def logFailuresBuilder[A](logEncode: (A, Err) => Unit, logDecode: (BitVector, Err) => Unit)(
codec: Codec[A]
): Codec[A] =
logBuilder[A](
(a, r) => r.fold(logEncode(a, _), constUnit),
(b, r) => r.fold(logDecode(b, _), constUnit)
)(codec)
/**
* Combinator intended for use in debugging that logs all encoded values and decoded values to standard out.
*
* @param prefix prefix string to include in each log statement
*/
def logToStdOut[A](codec: Codec[A], prefix: String = ""): Codec[A] =
val pfx = if prefix.isEmpty then "" else s"$prefix: "
logBuilder[A](
(a, r) => println(s"${pfx}encoded $a to $r"),
(b, r) => println(s"${pfx}decoded $b to $r")
)(codec)
/**
* Combinator intended for use in debugging that logs all failures while encoding or decoding to standard out.
*
* @param prefix prefix string to include in each log statement
*/
def logFailuresToStdOut[A](codec: Codec[A], prefix: String = ""): Codec[A] =
val pfx = if prefix.isEmpty then "" else s"$prefix: "
logFailuresBuilder[A](
(a, e) => println(s"${pfx}failed to encode $a: $e"),
(b, e) => println(s"${pfx}failed to decode $b: $e")
)(codec)
/**
* Codec that ensures variable size data is constrained within a minSize and maxSize bounds.
*
* This means that the size is variable only within a limited range. It will work just as variableSizeBytes codec,
* but ensuring that the binary data is at least `minSize` bytes long and at most `maxSize` bytes long.
*
* The `minSize` has the default value of `0`.
*
* @param size codec that encodes/decodes the size in bits
* @param value codec the encodes/decodes the value
* @param minSize minimum size in bytes that the message can have
* @param maxSize maximum size in bytes that the message can have
*/
def constrainedVariableSizeBytes[A](
size: Codec[Int],
value: Codec[A],
minSize: Int,
maxSize: Int
): Codec[A] =
new ConstrainedVariableSizeCodec(widenIntToLong(size), value, minSize.toLong, maxSize.toLong)
/**
* Codec that ensures variable size data is constrained within a minSize and maxSize bounds.
*
* This means that the size is variable only within a limited range. It will work just as variableSizeBytes codec,
* but ensuring that the binary data is at least `minSize` bytes long and at most `maxSize` bytes long.
*
* The `minSize` has the default value of `0`.
*
* @param size codec that encodes/decodes the size in bits
* @param value codec the encodes/decodes the value
* @param maxSize maximum size in bytes that the message can have
* @param minSize minimum size in bytes that the message can have
*/
def constrainedVariableSizeBytesLong[A](
size: Codec[Long],
value: Codec[A],
minSize: Long,
maxSize: Long
): Codec[A] =
new ConstrainedVariableSizeCodec(size, value, minSize, maxSize)
/**
* Codec that ensures variable size data is constrained within a minSize and maxSize bounds.
*
* This means that the size is variable only within a limited range. It will work just as variableSizeBytes codec,
* but ensuring that the binary data is at least `minSize` bytes long and at most `maxSize` bytes long.
*
* The `minSize` has the default value of `0`.
*
* @param size codec that encodes/decodes the size in bits
* @param value codec the encodes/decodes the value
* @param maxSize maximum size in bytes that the message can have
*/
def constrainedVariableSizeBytes[A](size: Codec[Int], value: Codec[A], maxSize: Int): Codec[A] =
new ConstrainedVariableSizeCodec(widenIntToLong(size), value, 0L, maxSize.toLong)
/**
* Codec that ensures variable size data is constrained within a minSize and maxSize bounds.
*
* This means that the size is variable only within a limited range. It will work just as variableSizeBytes codec,
* but ensuring that the binary data is at least `minSize` bytes long and at most `maxSize` bytes long.
*
* The `minSize` has the default value of `0`.
*
* @param size codec that encodes/decodes the size in bits
* @param value codec the encodes/decodes the value
* @param maxSize maximum size in bytes that the message can have
*/
def constrainedVariableSizeBytesLong[A](
size: Codec[Long],
value: Codec[A],
maxSize: Long
): Codec[A] =
new ConstrainedVariableSizeCodec(size, value, 0, maxSize)
© 2015 - 2025 Weber Informatics LLC | Privacy Policy