com.pippsford.encoding.Base58 Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of common-utils Show documentation
Code that seems to me to have utility across multiple projects
The newest version!
package com.pippsford.encoding;

import java.util.Arrays;
import javax.annotation.Nullable;


/**
 * Base58 is a way to encode Bitcoin addresses (or arbitrary data) as alphanumeric strings.
 *
 * Note that this is not the same base58 as used by Flickr, which you may find referenced around the Internet.
 *
 * 
Satoshi explains: why base-58 instead of standard base-64 encoding?
 *
 * 
 Don't want 0OIl characters that look the same in some fonts and could be used to create visually identical looking account numbers. 
A string
 * with non-alphanumeric characters is not as easily accepted as an account number. 
E-mail usually won't line-break if there's no punctuation to break at.
 * 
Double-clicking selects the whole number as one word if it's all alphanumeric. 
 *
 * However, note that the encoding/decoding runs in O(n²) time, so it is not useful for large data.
 The basic idea of the encoding is to treat
 * the data bytes as a large number represented using base-256 digits, convert the number to be represented using base-58 digits, preserve the exact number of
 * leading zeros (which are otherwise lost during the mathematical operations on the numbers), and finally represent the resulting base-58 digits as
 * alphanumeric ASCII characters.
 */
public class Base58 implements Converter {

  private static final char[] ALPHABET =
      "123456789ABCDEFGHJKLMNPQRSTUVWXYZabcdefghijkmnopqrstuvwxyz".toCharArray();

  private static final char ENCODED_ZERO = ALPHABET[0];

  private static final int[] INDEXES = new int[128];


  /**
   * Divides a number, represented as an array of bytes each containing a single digit in the specified base, by the given divisor. The given number is modified
   * in-place to contain the quotient, and the return value is the remainder.
   *
   * @param number     the number to divide
   * @param firstDigit the index within the array of the first non-zero digit (this is used for optimization by skipping the leading zeros)
   * @param base       the base in which the number's digits are represented (up to 256)
   * @param divisor    the number to divide by (up to 256)
   *
   * @return the remainder of the division operation
   */
  private static byte divmod(byte[] number, int firstDigit, int base, int divisor) {
    // this is just long division which accounts for the base of the input digits
    int remainder = 0;
    for (int i = firstDigit; i < number.length; i++) {
      int digit = (int) number[i] & 0xFF;
      int temp = remainder * base + digit;
      number[i] = (byte) (temp / divisor);
      remainder = temp % divisor;
    }
    return (byte) remainder;
  }


  static {
    Arrays.fill(INDEXES, -1);
    for (int i = 0; i < ALPHABET.length; i++) {
      INDEXES[ALPHABET[i]] = i;
    }
  }


  @Nullable
  @Override
  public char[] clean(char[] text) {
    if (text == null) {
      return null;
    }
    char[] buf = new char[text.length];
    int pos = 0;
    for (char ch : text) {
      if (ch < 128 && INDEXES[ch] != -1) {
        buf[pos] = ch;
        pos++;
      }
    }
    return TextToByte.trim(buf, pos);
  }


  /**
   * Decodes the given base58 string into the original data bytes.
   *
   * @param input the base58-encoded string to decode
   *
   * @return the decoded data bytes
   */
  @Nullable
  public byte[] decode(char[] input) {
    if (input == null) {
      return null;
    }
    if (input.length == 0) {
      return new byte[0];
    }
    // Convert the base58-encoded ASCII chars to a base58 byte sequence (base58 digits).
    byte[] input58 = new byte[input.length];
    for (int i = 0; i < input.length; ++i) {
      char c = input[i];
      int digit = c < 128 ? INDEXES[c] : -1;
      if (digit < 0) {
        throw new IllegalArgumentException("Illegal character " + c + " at position " + i);
      }
      input58[i] = (byte) digit;
    }
    // Count leading zeros.
    int zeros = 0;
    while (zeros < input58.length && input58[zeros] == 0) {
      ++zeros;
    }
    // Convert base-58 digits to base-256 digits.
    byte[] decoded = new byte[input.length];
    int outputStart = decoded.length;
    int inputStart = zeros;
    while (inputStart < input58.length) {
      decoded[--outputStart] = divmod(input58, inputStart, 58, 256);
      if (input58[inputStart] == 0) {
        ++inputStart; // optimization - skip leading zeros
      }
    }
    // Ignore extra leading zeroes that were added during the calculation.
    while (outputStart < decoded.length && decoded[outputStart] == 0) {
      ++outputStart;
    }
    // Return decoded data (including original number of leading zeros).
    return Arrays.copyOfRange(decoded, outputStart - zeros, decoded.length);
  }


  /**
   * Encodes the given bytes as a base58 string (no checksum is appended).
   *
   * @param input the bytes to encode
   *
   * @return the base58-encoded string
   */
  @Nullable
  public char[] encodeChars(byte[] input) {
    if (input == null) {
      return null;
    }
    if (input.length == 0) {
      return new char[0];
    }
    // Count leading zeros.
    int zeros = 0;
    while (zeros < input.length && input[zeros] == 0) {
      ++zeros;
    }
    // Convert base-256 digits to base-58 digits (plus conversion to ASCII characters)
    input = Arrays.copyOf(input, input.length); // since we modify it in-place
    char[] encoded = new char[input.length * 2]; // upper bound
    int outputStart = encoded.length;
    int inputStart = zeros;
    while (inputStart < input.length) {
      encoded[--outputStart] = ALPHABET[divmod(input, inputStart, 256, 58)];
      if (input[inputStart] == 0) {
        ++inputStart; // optimization - skip leading zeros
      }
    }
    // Preserve exactly as many leading encoded zeros in output as there were leading zeros in
    // input.
    while (outputStart < encoded.length && encoded[outputStart] == ENCODED_ZERO) {
      ++outputStart;
    }
    while (--zeros >= 0) {
      encoded[--outputStart] = ENCODED_ZERO;
    }
    // Return encoded string (including encoded leading zeros).
    char[] out = new char[encoded.length - outputStart];
    System.arraycopy(encoded, outputStart, out, 0, out.length);
    return out;
  }

}