org.wildfly.common.archive.Archive Maven / Gradle / Ivy
package org.wildfly.common.archive;
import static java.lang.Math.min;
import java.io.Closeable;
import java.io.IOException;
import java.io.InputStream;
import java.nio.ByteBuffer;
import java.nio.ByteOrder;
import java.nio.channels.FileChannel;
import java.nio.charset.StandardCharsets;
import java.nio.file.Path;
import java.nio.file.StandardOpenOption;
import java.time.LocalDateTime;
import java.time.ZoneOffset;
import java.util.zip.DataFormatException;
import java.util.zip.Inflater;
import java.util.zip.InflaterInputStream;
import org.wildfly.common.Assert;
/**
*/
public final class Archive implements Closeable {
public static final int GP_ENCRYPTED = 1 << 0;
// only if method == implode
public static final int GP_IMPLODE_8K_DICTIONARY = 1 << 1;
public static final int GP_IMPLODE_3_TREES = 1 << 2;
// only if method == deflate
public static final int GP_DEFLATE_COMP_OPT_MASK = 0b11 << 1;
public static final int GP_DEFLATE_COMP_OPT_NORMAL = 0b00 << 1;
public static final int GP_DEFLATE_COMP_OPT_MAXIMUM = 0b01 << 1;
public static final int GP_DEFLATE_COMP_OPT_FAST = 0b10 << 1;
public static final int GP_DEFLATE_COMP_OPT_SUPER_FAST = 0b11 << 1;
// only if method == lzma
public static final int GP_LZMA_EOS_USED = 1 << 1;
public static final int GP_LATE_SIZES = 1 << 3;
// reserved 1 << 4
public static final int GP_COMPRESSED_PATCHED = 1 << 5;
public static final int GP_STRONG_ENCRYPTION = 1 << 6;
// reserved 1 << 7
// reserved 1 << 8
// reserved 1 << 9
// reserved 1 << 10
public static final int GP_UTF_8 = 1 << 11;
// reserved 1 << 12
public static final int GP_CD_MASKED = 1 << 13;
// reserved 1 << 14
// reserved 1 << 15
public static final int METHOD_STORED = 0;
public static final int METHOD_SHRINK = 1;
public static final int METHOD_REDUCE_1 = 2;
public static final int METHOD_REDUCE_2 = 3;
public static final int METHOD_REDUCE_3 = 4;
public static final int METHOD_REDUCE_4 = 5;
public static final int METHOD_IMPLODE = 6;
public static final int METHOD_DEFLATE = 8;
public static final int METHOD_DEFLATE64 = 9;
public static final int METHOD_BZIP2 = 12;
public static final int METHOD_LZMA = 14;
public static final int MADE_BY_MS_DOS = 0;
public static final int MADE_BY_UNIX = 3;
public static final int MADE_BY_NTFS = 10;
public static final int MADE_BY_OS_X = 19;
public static final int SIG_LH = 0x04034b50;
public static final int LH_SIGNATURE = 0;
public static final int LH_MIN_VERSION = 4;
public static final int LH_GP_BITS = 6;
public static final int LH_COMP_METHOD = 8;
public static final int LH_MOD_TIME = 10;
public static final int LH_MOD_DATE = 12;
public static final int LH_CRC_32 = 14;
public static final int LH_COMPRESSED_SIZE = 18;
public static final int LH_UNCOMPRESSED_SIZE = 22;
public static final int LH_FILE_NAME_LENGTH = 26;
public static final int LH_EXTRA_LENGTH = 28;
public static final int LH_END = 30;
public static final int SIG_DD = 0x08074b50;
public static final int DD_SIGNATURE = 0;
public static final int DD_CRC_32 = 4;
public static final int DD_COMPRESSED_SIZE = 8;
public static final int DD_UNCOMPRESSED_SIZE = 12;
public static final int DD_END = 16;
public static final int DD_ZIP64_COMPRESSED_SIZE = 8;
public static final int DD_ZIP64_UNCOMPRESSED_SIZE = 16;
public static final int DD_ZIP64_END = 24;
public static final int SIG_CDE = 0x02014b50;
public static final int CDE_SIGNATURE = 0;
public static final int CDE_VERSION_MADE_BY = 4;
public static final int CDE_VERSION_NEEDED = 6;
public static final int CDE_GP_BITS = 8;
public static final int CDE_COMP_METHOD = 10;
public static final int CDE_MOD_TIME = 12;
public static final int CDE_MOD_DATE = 14;
public static final int CDE_CRC_32 = 16;
public static final int CDE_COMPRESSED_SIZE = 20;
public static final int CDE_UNCOMPRESSED_SIZE = 24;
public static final int CDE_FILE_NAME_LENGTH = 28;
public static final int CDE_EXTRA_LENGTH = 30;
public static final int CDE_COMMENT_LENGTH = 32;
public static final int CDE_FIRST_DISK_NUMBER = 34;
public static final int CDE_INTERNAL_ATTRIBUTES = 36;
public static final int CDE_EXTERNAL_ATTRIBUTES = 38;
public static final int CDE_LOCAL_HEADER_OFFSET = 42; // relative to the start of the above first disk number
public static final int CDE_END = 46;
public static final int SIG_EOCD = 0x06054b50;
public static final int EOCD_SIGNATURE = 0;
public static final int EOCD_DISK_NUMBER = 4;
public static final int EOCD_CD_FIRST_DISK_NUMBER = 6;
public static final int EOCD_CDE_COUNT_THIS_DISK = 8;
public static final int EOCD_CDE_COUNT_ALL = 10;
public static final int EOCD_CD_SIZE = 12;
public static final int EOCD_CD_START_OFFSET = 16;
public static final int EOCD_COMMENT_LENGTH = 20;
public static final int EOCD_END = 22;
public static final int EXT_ID_ZIP64 = 0x0001;
public static final int ZIP64_UNCOMPRESSED_SIZE = 0;
public static final int ZIP64_COMPRESSED_SIZE = 8;
public static final int ZIP64_LOCAL_HEADER_OFFSET = 16;
public static final int ZIP64_FIRST_DISK_NUMBER = 24; // 4 bytes
public static final int ZIP64_END = 28;
public static final int EXT_ID_UNIX = 0x000d;
public static final int UNIX_ACCESS_TIME = 0;
public static final int UNIX_MODIFIED_TIME = 4;
public static final int UNIX_UID = 8;
public static final int UNIX_GID = 10;
public static final int UNIX_END = 12; // symlink target
public static final int UNIX_DEV_MAJOR = 12; // if it's a device node
public static final int UNIX_DEV_MINOR = 16;
public static final int UNIX_DEV_END = 20;
public static final int SIG_EOCD_ZIP64 = 0x06064b50;
public static final int EOCD_ZIP64_SIGNATURE = 0;
public static final int EOCD_ZIP64_SIZE = 4;
public static final int EOCD_ZIP64_VERSION_MADE_BY = 12;
public static final int EOCD_ZIP64_VERSION_NEEDED = 14;
public static final int EOCD_ZIP64_DISK_NUMBER = 16;
public static final int EOCD_ZIP64_CD_FIRST_DISK_NUMBER = 20;
public static final int EOCD_ZIP64_CDE_COUNT_THIS_DISK = 24;
public static final int EOCD_ZIP64_CDE_COUNT_ALL = 28;
public static final int EOCD_ZIP64_CD_SIZE = 36;
public static final int EOCD_ZIP64_CD_START_OFFSET = 44;
public static final int EOCD_ZIP64_END = 52;
public static final int SIG_EOCDL_ZIP64 = 0x07064b50;
public static final int EOCDL_ZIP64_SIGNATURE = 0;
public static final int EOCDL_ZIP64_EOCD_DISK_NUMBER = 4;
public static final int EOCDL_ZIP64_EOCD_OFFSET = 8;
public static final int EOCDL_ZIP64_DISK_COUNT = 16;
public static final int EOCDL_ZIP64_END = 20;
/**
* Maximum size of a single buffer.
*/
private static final int BUF_SIZE_MAX = 0x4000_0000;
private static final int BUF_SHIFT = Integer.numberOfTrailingZeros(BUF_SIZE_MAX);
private static final int BUF_SIZE_MASK = BUF_SIZE_MAX - 1;
private final ByteBuffer[] bufs;
private final long offset;
private final long length;
private final long cd;
private final Index index;
private Archive(final ByteBuffer[] bufs, final long offset, final long length, final long cd, final Index index) {
this.bufs = bufs;
this.offset = offset;
this.length = length;
this.cd = cd;
this.index = index;
}
public static Archive open(Path path) throws IOException {
try (FileChannel fc = FileChannel.open(path, StandardOpenOption.READ)) {
long size = fc.size();
final int bufCnt = Math.toIntExact((size + BUF_SIZE_MASK) >> BUF_SHIFT);
final ByteBuffer[] array = new ByteBuffer[bufCnt];
long offs = 0;
int idx = 0;
while (size > BUF_SIZE_MASK) {
array[idx++] = fc.map(FileChannel.MapMode.READ_ONLY, offs, BUF_SIZE_MAX).order(ByteOrder.LITTLE_ENDIAN);
size -= BUF_SIZE_MAX;
offs += BUF_SIZE_MAX;
}
array[idx] = fc.map(FileChannel.MapMode.READ_ONLY, offs, size).order(ByteOrder.LITTLE_ENDIAN);
return open(array);
}
}
public static Archive open(ByteBuffer buf) throws IOException {
Assert.checkNotNullParam("buf", buf);
if (buf.order() == ByteOrder.BIG_ENDIAN) {
buf = buf.duplicate().order(ByteOrder.LITTLE_ENDIAN);
}
return open(new ByteBuffer[] { buf });
}
static Archive open(ByteBuffer[] bufs) throws IOException {
return open(bufs, 0, capacity(bufs));
}
static Archive open(ByteBuffer[] bufs, long offset, long length) throws IOException {
// find the directory by looking first at its expected location and working our way backwards
long eocd = length - EOCD_END;
// todo: this could be optimized a bit (boyer-moore for example)
while (getUnsignedInt(bufs, offset + eocd) != SIG_EOCD) {
if (eocd == 0) {
throw new IOException("Invalid archive");
}
eocd--;
}
int entries = getUnsignedShort(bufs, offset + eocd + EOCD_CDE_COUNT_ALL);
// validate the EOCD record
if (getUnsignedShort(bufs, offset + eocd + EOCD_CD_FIRST_DISK_NUMBER) != 0 || getUnsignedShort(bufs, offset + eocd + EOCD_DISK_NUMBER) != 0 || entries != getUnsignedShort(bufs, offset + eocd + EOCD_CDE_COUNT_THIS_DISK)) {
throw new IOException("Multi-disk archives are not supported");
}
// check now for zip64
long eocdLocZip64 = eocd - EOCDL_ZIP64_END;
long eocdZip64 = -1;
if (getInt(bufs, offset + eocdLocZip64 + EOCDL_ZIP64_SIGNATURE) == SIG_EOCDL_ZIP64) {
// probably zip64
// validate the EOCDL_ZIP64
if (getInt(bufs, offset + eocdLocZip64 + EOCDL_ZIP64_DISK_COUNT) != 1 || getInt(bufs, offset + eocdLocZip64 + EOCDL_ZIP64_EOCD_DISK_NUMBER) != 0) {
throw new IOException("Multi-disk archives are not supported");
}
eocdZip64 = getLong(bufs, offset + eocdLocZip64 + EOCDL_ZIP64_EOCD_OFFSET);
if (getUnsignedInt(bufs, offset + eocdZip64 + EOCD_ZIP64_SIGNATURE) != SIG_EOCD_ZIP64) {
// oops, zip64 isn't really present, just bad luck
eocdZip64 = -1;
}
}
long cd;
cd = getUnsignedInt(bufs, offset + eocd + EOCD_CD_START_OFFSET);
if (cd == 0xffffffffL && eocdZip64 != -1) {
cd = getLong(bufs, offset + eocdZip64 + EOCD_ZIP64_CD_START_OFFSET);
}
if (entries == 0xffff && eocdZip64 != -1) {
final long cnt = getUnsignedInt(bufs, offset + eocdZip64 + EOCD_ZIP64_CDE_COUNT_ALL);
if (cnt > 0x07ff_ffffL) {
throw new IOException("Archive has too many entries");
}
entries = (int) cnt;
}
// generate the index
Index index;
if (length <= 0xfffe) {
index = new TinyIndex(entries);
} else if (length <= 0xffff_ffffeL) {
index = new LargeIndex(entries);
} else {
index = new HugeIndex(entries);
}
// iterate the directory
final int mask = index.getMask();
long cde = cd;
for (int i = 0; i < entries; i ++) {
if (getInt(bufs, offset + cde + CDE_SIGNATURE) != SIG_CDE) {
throw new IOException("Archive appears to be corrupted");
}
int hc = getHashCodeOfEntry(bufs, offset + cde);
index.put(hc & mask, cde);
cde = cde + CDE_END + getUnsignedShort(bufs, offset + cde + CDE_FILE_NAME_LENGTH) + getUnsignedShort(bufs, offset + cde + CDE_EXTRA_LENGTH) + getUnsignedShort(bufs, offset + cde + CDE_COMMENT_LENGTH);
}
return new Archive(bufs, offset, length, cd, index);
}
private static String getNameOfEntry(ByteBuffer[] bufs, long cde) {
long name = cde + CDE_END;
int nameLen = getUnsignedShort(bufs, cde + CDE_FILE_NAME_LENGTH);
boolean utf8 = (getUnsignedShort(bufs, cde + CDE_GP_BITS) & GP_UTF_8) != 0;
if (utf8) {
return new String(getBytes(bufs, name, nameLen), StandardCharsets.UTF_8);
} else {
char[] nameChars = new char[nameLen];
for (int i = 0; i < nameLen; i ++) {
nameChars[i] = Cp437.charFor(getUnsignedByte(bufs, name + i));
}
return new String(nameChars);
}
}
private static int getHashCodeOfEntry(ByteBuffer[] bufs, long cde) {
long name = cde + CDE_END;
int nameLen = getUnsignedShort(bufs, cde + CDE_FILE_NAME_LENGTH);
boolean utf8 = (getUnsignedShort(bufs, cde + CDE_GP_BITS) & GP_UTF_8) != 0;
int hc = 0;
if (utf8) {
int cp;
for (int i = 0; i < nameLen; i += Utf8.getByteCount(getUnsignedByte(bufs, name + i))) {
cp = Utf8.codePointAt(bufs, name + i);
if (Character.isSupplementaryCodePoint(cp)) {
hc = hc * 31 + Character.highSurrogate(cp);
hc = hc * 31 + Character.lowSurrogate(cp);
} else {
hc = hc * 31 + cp;
}
}
} else {
for (int i = 0; i < nameLen; i ++) {
hc = hc * 31 + Cp437.charFor(getUnsignedByte(bufs, name + i));
}
}
return hc;
}
public long getFirstEntryHandle() {
return cd;
}
public long getNextEntryHandle(long entryHandle) {
final long next = entryHandle + CDE_END + getUnsignedShort(bufs, offset + entryHandle + CDE_FILE_NAME_LENGTH) + getUnsignedShort(bufs, offset + entryHandle + CDE_EXTRA_LENGTH);
if (next >= length || getInt(bufs, offset + next + CDE_SIGNATURE) != SIG_CDE) {
return -1;
}
return next;
}
public long getEntryHandle(String fileName) {
final int mask = index.getMask();
final int base = fileName.hashCode();
long entryHandle;
for (int i = 0; i < mask; i ++) {
entryHandle = index.get(base + i & mask);
if (entryHandle == -1) {
return -1;
}
if (entryNameEquals(entryHandle, fileName)) {
return entryHandle;
}
}
return -1;
}
public boolean entryNameEquals(final long entryHandle, final String fileName) {
long name = entryHandle + CDE_END;
int nameLen = getUnsignedShort(bufs, offset + entryHandle + CDE_FILE_NAME_LENGTH);
boolean utf8 = (getUnsignedShort(bufs, offset + entryHandle + CDE_GP_BITS) & GP_UTF_8) != 0;
final int length = fileName.length();
if (utf8) {
long i;
int j;
for (i = 0, j = 0; i < nameLen && j < length; i += Utf8.getByteCount(getUnsignedByte(bufs, offset + name + i)), j = fileName.offsetByCodePoints(j, 1)) {
if (Utf8.codePointAt(bufs, offset + name + i) != fileName.codePointAt(j)) {
return false;
}
}
return i == nameLen && j == length;
} else {
int i, j;
for (i = 0, j = 0; i < nameLen && j < length; i++, j = fileName.offsetByCodePoints(j, 1)) {
if (Cp437.charFor(getUnsignedByte(bufs, offset + i + entryHandle + CDE_END)) != fileName.codePointAt(j)) {
return false;
}
}
return i == nameLen && j == length;
}
}
private long getLocalHeader(long entryHandle) {
long lh = getUnsignedInt(bufs, offset + entryHandle + CDE_LOCAL_HEADER_OFFSET);
if (lh == 0xffff_ffffL) {
long zip64 = getExtraRecord(entryHandle, EXT_ID_ZIP64);
if (zip64 != -1) {
lh = getLong(bufs, offset + zip64 + ZIP64_LOCAL_HEADER_OFFSET);
}
}
return lh;
}
public String getEntryName(long entryHandle) {
return getNameOfEntry(bufs, entryHandle);
}
public ByteBuffer getEntryContents(long entryHandle) throws IOException {
long size = getUncompressedSize(entryHandle);
long compSize = getCompressedSize(entryHandle);
if (size > 0x1000_0000 || compSize > 0x1000_0000) {
throw new IOException("Entry is too large to read into RAM");
}
long localHeader = getLocalHeader(entryHandle);
if ((getUnsignedShort(bufs, offset + localHeader + LH_GP_BITS) & (GP_ENCRYPTED | GP_STRONG_ENCRYPTION)) != 0) {
throw new IOException("Cannot read encrypted entries");
}
final long offset = getDataOffset(localHeader);
final int method = getCompressionMethod(entryHandle);
switch (method) {
case METHOD_STORED: {
return bufferOf(bufs, this.offset + offset, (int) size);
}
case METHOD_DEFLATE: {
final Inflater inflater = new Inflater(true);
try {
return JDKSpecific.inflate(inflater, bufs, this.offset + offset, (int) compSize, (int) size);
} catch (DataFormatException e) {
throw new IOException(e);
} finally {
inflater.end();
}
}
default: {
throw new IOException("Unsupported compression scheme");
}
}
}
private long getDataOffset(final long localHeader) {
return localHeader + LH_END + getUnsignedShort(bufs, offset + localHeader + LH_FILE_NAME_LENGTH) + getUnsignedShort(bufs, offset + localHeader + LH_EXTRA_LENGTH);
}
public InputStream getEntryStream(final long entryHandle) throws IOException {
long size = getCompressedSize(entryHandle);
long localHeader = getLocalHeader(entryHandle);
if ((getUnsignedShort(bufs, offset + localHeader + LH_GP_BITS) & (GP_ENCRYPTED | GP_STRONG_ENCRYPTION)) != 0) {
throw new IOException("Cannot read encrypted entries");
}
final long offset = getDataOffset(localHeader);
final int method = getCompressionMethod(entryHandle);
switch (method) {
case METHOD_STORED: {
return new ByteBufferInputStream(bufs, this.offset + offset, size);
}
case METHOD_DEFLATE: {
return new InflaterInputStream(new ByteBufferInputStream(bufs, this.offset + offset, size));
}
default: {
throw new IOException("Unsupported compression scheme");
}
}
}
public Archive getNestedArchive(long entryHandle) throws IOException {
long localHeader = getLocalHeader(entryHandle);
if ((getUnsignedShort(bufs, this.offset + localHeader + LH_GP_BITS) & (GP_ENCRYPTED | GP_STRONG_ENCRYPTION)) != 0) {
throw new IOException("Cannot read encrypted entries");
}
final long offset = getDataOffset(localHeader);
final int method = getCompressionMethod(entryHandle);
if (method != METHOD_STORED) {
throw new IOException("Cannot open compressed nested archive");
}
long size = getUncompressedSize(entryHandle);
if (size < Integer.MAX_VALUE) {
final ByteBuffer slice = sliceOf(bufs, this.offset + offset, (int) size);
if (slice != null) {
return Archive.open(slice);
}
}
return Archive.open(bufs, this.offset + offset, size);
}
public boolean isCompressed(long entryHandle) {
return getCompressionMethod(entryHandle) != METHOD_STORED;
}
private int getCompressionMethod(final long entryHandle) {
return getUnsignedShort(bufs, offset + entryHandle + CDE_COMP_METHOD);
}
private long getExtraRecord(final long entryHandle, final int headerId) {
long extra = entryHandle + CDE_END + getUnsignedShort(bufs, offset + entryHandle + CDE_FILE_NAME_LENGTH) + getUnsignedShort(bufs, offset + entryHandle + CDE_COMMENT_LENGTH);
int extraLen = getUnsignedShort(bufs, offset + entryHandle + CDE_EXTRA_LENGTH);
for (int i = 0; i < extraLen; i = i + getUnsignedShort(bufs, offset + extra + i + 2)) {
if (getUnsignedShort(bufs, offset + extra + i) == headerId) {
return extra + i + 4;
}
}
return -1;
}
public long getUncompressedSize(long entryHandle) {
long size = getUnsignedInt(bufs, offset + entryHandle + CDE_UNCOMPRESSED_SIZE);
if (size == 0xffffffff) {
long zip64 = getExtraRecord(entryHandle, EXT_ID_ZIP64);
if (zip64 != -1) {
size = getLong(bufs, offset + zip64 + ZIP64_UNCOMPRESSED_SIZE);
}
}
return size;
}
public long getCompressedSize(long entryHandle) {
long size = getUnsignedInt(bufs, offset + entryHandle + CDE_COMPRESSED_SIZE);
if (size == 0xffffffff) {
long zip64 = getExtraRecord(entryHandle, EXT_ID_ZIP64);
if (zip64 != -1) {
size = getLong(bufs, offset + zip64 + ZIP64_COMPRESSED_SIZE);
}
}
return size;
}
public long getModifiedTime(long entryHandle) {
long unix = getExtraRecord(entryHandle, EXT_ID_UNIX);
if (unix != -1) {
long unixTime = getUnsignedInt(bufs, offset + unix + UNIX_MODIFIED_TIME);
if (unixTime != 0) {
return unixTime * 1000;
}
}
// todo: NTFS (0x000a) sub-tag ID 0x0001 contains an 8-byte mtime
return dosTimeStamp(getUnsignedShort(bufs, offset + entryHandle + CDE_MOD_TIME), getUnsignedShort(bufs, offset + entryHandle + CDE_MOD_DATE));
}
public void close() {
}
private static long dosTimeStamp(int modTime, int modDate) {
int year = 1980 + (modDate >> 9);
int month = 1 + ((modDate >> 5) & 0b1111);
int day = modDate & 0b11111;
int hour = modTime >> 11;
int minute = (modTime >> 5) & 0b111111;
int second = (modTime & 0b11111) << 1;
return LocalDateTime.of(year, month, day, hour, minute, second).toInstant(ZoneOffset.UTC).toEpochMilli();
}
public boolean isDirectory(final long entryHandle) {
final int madeBy = getUnsignedShort(bufs, offset + entryHandle + CDE_VERSION_MADE_BY);
final int extAttr = getInt(bufs, entryHandle + CDE_EXTERNAL_ATTRIBUTES);
switch (madeBy) {
case MADE_BY_UNIX: {
//noinspection OctalInteger
return (extAttr & 0170000) == 0040000;
}
default: {
return (extAttr & 0b10000) != 0;
}
}
}
/**
* Only loaded if CP-437 zip entries exist, which is unlikely but allowed.
*/
static final class Cp437 {
static final char[] codePoints = {
'\0','☺', '☻', '♥', '♦', '♣', '♠', '•', '◘', '○', '◙', '♂', '♀', '♪', '♫', '☼',
'►', '◄', '↕', '‼', '¶', '§', '▬', '↨', '↑', '↓', '→', '←', '∟', '↔', '▲', '▼',
' ', '!', '"', '#', '$', '%', '&', '\'','(', ')', '*', '+', ',', '-', '.', '/',
'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', ':', ';', '<', '=', '>', '?',
'@', 'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O',
'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', '[', '\\',']', '^', '_',
'`', 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', '{', '|', '}', '~', '⌂',
'Ç', 'ü', 'é', 'â', 'ä', 'à', 'å', 'ç', 'ê', 'ë', 'è', 'ï', 'î', 'ì', 'Ä', 'Å',
'É', 'æ', 'Æ', 'ô', 'ö', 'ò', 'û', 'ù', 'ÿ', 'Ö', 'Ü', '¢', '£', '¥', '₧', 'ƒ',
'á', 'í', 'ó', 'ú', 'ñ', 'Ñ', 'ª', 'º', '¿', '⌐', '¬', '½', '¼', '¡', '«', '»',
'░', '▒', '▓', '│', '┤', '╡', '╢', '╖', '╕', '╣', '║', '╗', '╝', '╜', '╛', '┐',
'└', '┴', '┬', '├', '─', '┼', '╞', '╟', '╚', '╔', '╩', '╦', '╠', '═', '╬', '╧',
'╨', '╤', '╥', '╙', '╘', '╒', '╓', '╫', '╪', '┘', '┌', '█', '▄', '▌', '▐', '▀',
'α', 'ß', 'Γ', 'π', 'Σ', 'σ', 'µ', 'τ', 'Φ', 'Θ', 'Ω', 'δ', '∞', 'φ', 'ε', '∩',
'≡', '±', '≥', '≤', '⌠', '⌡', '÷', '≈', '°', '∙', '·', '√', 'ⁿ', '²', '■', 0xA0
};
private Cp437() {}
static char charFor(int c) {
return codePoints[c];
}
}
static final class Utf8 {
private Utf8() {}
static int getByteCount(final int a) {
if (a <= 0b0111_1111) {
return 1;
} else if (a <= 0b1011_1111) {
// invalid garbage (1 byte)
return 1;
} else if (a <= 0b1101_1111) {
return 2;
} else if (a <= 0b1110_1111) {
return 3;
} else if (a <= 0b1111_0111) {
return 4;
} else {
// invalid garbage (1 byte)
return 1;
}
}
static int codePointAt(final ByteBuffer[] bufs, final long i) {
final int a = getUnsignedByte(bufs, i);
if (a <= 0b0111_1111) {
return a;
} else if (a <= 0b1011_1111) {
// invalid garbage (1 byte)
return '�';
}
int b = getUnsignedByte(bufs, i + 1);
if ((b & 0b11_000000) != 0b10_000000) {
// second byte is invalid; return � instead
return '�';
}
if (a <= 0b1101_1111) {
// two bytes
return (a & 0b000_11111) << 6 | b & 0b00_111111;
}
int c = getUnsignedByte(bufs, i + 2);
if ((c & 0b11_000000) != 0b10_000000) {
// third byte is invalid; return � instead
return '�';
}
if (a <= 0b1110_1111) {
// three bytes
return (a & 0b0000_1111) << 12 | (b & 0b00_111111) << 6 | c & 0b00_111111;
}
int d = getUnsignedByte(bufs, i + 3);
if ((d & 0b11_000000) != 0b10_000000) {
// fourth byte is invalid; return � instead
return '�';
}
if (a <= 0b1111_0111) {
// four bytes
return (a & 0b00000_111) << 18 | (b & 0b00_111111) << 12 | (c & 0b00_111111) << 6 | d & 0b00_111111;
}
// invalid garbage (1 byte)
return '�';
}
}
static int bufIdx(long idx) {
return (int) (idx >>> BUF_SHIFT);
}
static int bufOffs(long idx) {
return ((int)idx) & BUF_SIZE_MASK;
}
static byte getByte(ByteBuffer[] bufs, long idx) {
return bufs[bufIdx(idx)].get(bufOffs(idx));
}
static int getUnsignedByte(ByteBuffer[] bufs, long idx) {
return getByte(bufs, idx) & 0xff;
}
static int getUnsignedByte(ByteBuffer buf, int idx) {
return buf.get(idx) & 0xff;
}
static short getShort(ByteBuffer[] bufs, long idx) {
final int bi = bufIdx(idx);
return bi == bufIdx(idx + 1) ? bufs[bi].getShort(bufOffs(idx)) : (short) (getUnsignedByte(bufs, idx) | getByte(bufs, idx + 1) << 8);
}
static int getUnsignedShort(ByteBuffer[] bufs, long idx) {
return getShort(bufs, idx) & 0xffff;
}
static int getMedium(ByteBuffer[] bufs, long idx) {
return getUnsignedByte(bufs, idx) | getUnsignedShort(bufs, idx + 1) << 8;
}
static long getUnsignedMedium(ByteBuffer[] bufs, long idx) {
return getUnsignedByte(bufs, idx) | getUnsignedShort(bufs, idx + 1) << 8;
}
static int getInt(ByteBuffer[] bufs, long idx) {
final int bi = bufIdx(idx);
return bi == bufIdx(idx + 3) ? bufs[bi].getInt(bufOffs(idx)) : getUnsignedShort(bufs, idx) | getShort(bufs, idx + 2) << 16;
}
static long getUnsignedInt(ByteBuffer[] bufs, long idx) {
return getInt(bufs, idx) & 0xffff_ffffL;
}
static long getLong(ByteBuffer[] bufs, long idx) {
final int bi = bufIdx(idx);
return bi == bufIdx(idx + 7) ? bufs[bi].getLong(bufOffs(idx)) : getUnsignedInt(bufs, idx) | (long)getInt(bufs, idx + 4) << 32;
}
static void readBytes(ByteBuffer[] bufs, long idx, byte[] dest, int off, int len) {
while (len > 0) {
final int bi = bufIdx(idx);
final int bo = bufOffs(idx);
ByteBuffer buf = bufs[bi].duplicate();
buf.position(bo);
final int cnt = min(len, buf.remaining());
buf.get(dest, 0, cnt);
len -= cnt;
off += cnt;
idx += cnt;
}
}
static byte[] getBytes(ByteBuffer[] bufs, long idx, int len) {
final byte[] bytes = new byte[len];
readBytes(bufs, idx, bytes, 0, len);
return bytes;
}
private static final ByteBuffer EMPTY_BUF = ByteBuffer.allocateDirect(0);
static ByteBuffer sliceOf(ByteBuffer[] bufs, long idx, int len) {
if (len == 0) return EMPTY_BUF;
final int biStart = bufIdx(idx);
final int biEnd = bufIdx(idx + len - 1);
if (biStart == biEnd) {
final ByteBuffer buf = bufs[biStart].duplicate();
buf.position(bufOffs(idx));
buf.limit(buf.position() + len);
return buf.slice();
} else {
return null;
}
}
static ByteBuffer bufferOf(ByteBuffer[] bufs, long idx, int len) {
ByteBuffer buf = sliceOf(bufs, idx, len);
if (buf == null) {
buf = ByteBuffer.wrap(getBytes(bufs, idx, len));
}
return buf;
}
static long capacity(ByteBuffer[] bufs) {
final int lastIdx = bufs.length - 1;
return ((long) lastIdx) * BUF_SIZE_MAX + bufs[lastIdx].capacity();
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy