All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.scudata.dw.BlockLinkReader Maven / Gradle / Ivy

Go to download

SPL(Structured Process Language) A programming language specially for structured data computing.

There is a newer version: 20241126
Show newest version
package com.scudata.dw;

import java.io.IOException;
import java.io.InputStream;
import java.util.Arrays;

import com.scudata.dm.Sequence;

public class BlockLinkReader extends InputStream {
	private BlockLink blockLink;
	private IBlockStorage storage;
	
	private final int blockSize; // ???С
	private final int pointerPos; // ??һ??ָ???ڿ???λ??
	
	private long currentBlockPos = Long.MAX_VALUE;
	private byte []block; // ??ǰ????Ŀ?
	private int caret; // ?????block?е?λ??
	
	private byte[] readBuffer = new byte[32];
	private LZ4Util lz4 = LZ4Util.instance();
	private byte []decompressBuffer;
	
	private boolean isPureStorage;//???°汾?Ĵ??д洢??ʽ
	private Sequence dict;
	
	public BlockLinkReader(BlockLink blockLink) {
		this(blockLink, 0);
	}
	
	public BlockLinkReader(BlockLink blockLink, int sbLen) {
		this.blockLink = blockLink;
		storage = blockLink.getBlockStorage();
		
		blockSize = storage.getBlockSize();
		pointerPos = blockSize - IBlockStorage.POS_SIZE;
		block = new byte[blockSize];
		isPureStorage = storage.isPureFormat();
	}
	
	public BlockLinkReader(BlockLinkReader blockLinkReader) {
		blockLink = blockLinkReader.blockLink;
		storage = blockLinkReader.storage;
		blockSize = blockLinkReader.blockSize;
		pointerPos = blockLinkReader.pointerPos;
		currentBlockPos = blockLinkReader.currentBlockPos;
		block = Arrays.copyOf(blockLinkReader.block, blockSize);
		caret = blockLinkReader.caret;
		decompressBuffer = new byte[4096];
		isPureStorage = storage.isPureFormat();
		dict = blockLinkReader.dict;
	}
	
	public void close() {
		block = null;
	}
	
	void setDecompressBufferSize(int size) {
		decompressBuffer = new byte[size];
	}

	public void loadFirstBlock() throws IOException {
		loadBlock(blockLink.firstBlockPos);
	}
	
	public void loadBlock(long pos) throws IOException {
		currentBlockPos = pos;
		storage.loadBlock(pos, block);
		caret = 0;
	}
	
	public int read() throws IOException {
		if (caret == pointerPos) {
			loadBlock(readPosition(pointerPos));
		}
		
		return block[caret++] & 0xff;
	}
	
	public int read(byte b[], int off, int len) throws IOException {
		int count = len;
		while (true) {
			int freeSize = pointerPos - caret;
			if (len <= freeSize) {
				System.arraycopy(block, caret, b, off, len);
				caret += len;
				return count;
			} else {
				System.arraycopy(block, caret, b, off, freeSize);
				if (currentBlockPos < blockLink.lastBlockPos) {
					off += freeSize;
					len -= freeSize;
					loadBlock(readPosition(pointerPos));
				} else {
					caret = pointerPos;
					return count - len + freeSize;
				}
			}
		}
	}
	
	public void readFully(byte []b, int off, int len) throws IOException {
		while (true) {
			int freeSize = pointerPos - caret;
			if (len <= freeSize) {
				System.arraycopy(block, caret, b, off, len);
				caret += len;
				break;
			} else {
				System.arraycopy(block, caret, b, off, freeSize);
				off += freeSize;
				len -= freeSize;
				loadBlock(readPosition(pointerPos));
			}
		}
	}
	
	public int readInt32() throws IOException {
		if (pointerPos - caret >= 4) {
			byte []data = this.block;
			int index = this.caret;
			this.caret += 4;
			return (data[index] << 24) + ((data[index + 1] & 0xff) << 16) +
				((data[index + 2] & 0xff) << 8) + (data[index + 3] & 0xff);
		} else {
			byte []readBuffer = this.readBuffer;
			readFully(readBuffer, 0, 4);
			return (readBuffer[0] << 24) + ((readBuffer[1] & 0xff) << 16) +
				((readBuffer[2] & 0xff) << 8) + (readBuffer[3] & 0xff);
		}
	}
	
	// ????һ???ݿ鲢??ѹ
	public byte[] readDataBlock() throws IOException {
		int srcCount = readInt32();
		if (storage.isCompress()) {
			int count = readInt32();
			if (count > 0) {
				byte []buffer = new byte[count];
				
				readFully(buffer, 0, count);
	
				if (srcCount > decompressBuffer.length) {
					decompressBuffer = new byte[srcCount];
				}
				
				lz4.decompress(buffer, decompressBuffer, srcCount);
				return decompressBuffer;
			} else {
				byte []buffer = new byte[srcCount];
				readFully(buffer, 0, srcCount);
				return buffer;
			}
		} else {
			byte []buffer = new byte[srcCount];
			readFully(buffer, 0, srcCount);
			return buffer;
		}
	}
	
	// ????һ???ݿ?(????ѹ)
	public byte[] readDataBlock0() throws IOException {
		byte []readBuffer = this.readBuffer;
		readFully(readBuffer, 0, 4);
		int srcCount = (readBuffer[0] << 24) + ((readBuffer[1] & 0xff) << 16) +
			((readBuffer[2] & 0xff) << 8) + (readBuffer[3] & 0xff);

		if (storage.isCompress()) {
			readFully(readBuffer, 4, 4);
			int count = (readBuffer[4] << 24) + ((readBuffer[5] & 0xff) << 16) +
					((readBuffer[6] & 0xff) << 8) + (readBuffer[7] & 0xff);
			if (count > 0) {
				byte []buffer = new byte[count + 8];
				readFully(buffer, 8, count);
				System.arraycopy(readBuffer, 0, buffer, 0, 8);
				return buffer;
			} else {
				byte []buffer = new byte[srcCount + 8];
				readFully(buffer, 8, srcCount);
				System.arraycopy(readBuffer, 0, buffer, 0, 8);
				return buffer;
			}
		} else {
			byte []buffer = new byte[srcCount + 4];
			readFully(buffer, 4, srcCount);
			System.arraycopy(readBuffer, 0, buffer, 0, 4);
			return buffer;
		}
	}
	
	private long getBlockPos(long pos) {
		return pos - pos % blockSize;
	}
	
	public void seek(long pos) throws IOException {
		long blockPos = getBlockPos(pos);
		if (blockPos != currentBlockPos) {
			storage.loadBlock(blockPos, block);
			currentBlockPos = blockPos;
		}
		
		caret = (int)(pos - blockPos);
	}
	
	// ??ָ??λ?õ????ݿ鲢??ѹ
	public byte[] readDataBlock(long pos) throws IOException {
		seek(pos);
		return readDataBlock();
	}
	
	// ????????????һ???λ??
	private long readPosition(int i) {
		byte []block = this.block;
		return (((long)(block[i] & 0xff) << 32) +
				((long)(block[i + 1] & 0xff) << 24) +
				((block[i + 2] & 0xff) << 16) +
				((block[i + 3] & 0xff) <<  8) +
				(block[i + 4] & 0xff));
	}
	
	// ?????????????????ֽ????鷵??
	public byte[] readBlocks() throws IOException {
		int blockCount = blockLink.blockCount;
		if (blockCount > 1) {
			byte []bytes = new byte[pointerPos * blockCount];
			long blockPos = blockLink.firstBlockPos;
			for (int i = 0, j = 0; i < blockCount; ++i, j += pointerPos) {
				storage.loadBlock(blockPos, block);
				System.arraycopy(block, 0, bytes, j, pointerPos);
				blockPos = readPosition(pointerPos);
			}
			
			return bytes;
		} else {
			storage.loadBlock(blockLink.firstBlockPos, block);
			return block;
		}
	}
	
	//????ʽ?α???
	public BufferReader readBlockData(int recordCount) throws IOException {
		return getBufferReader(readDataBlock(), recordCount);
	}
	
	//????ʽ?α???
	public BufferReader readBlockData(long pos, int recordCount) throws IOException {
		byte[] buffer = readDataBlock(pos);
		return getBufferReader(buffer, recordCount);
	}
	
	//????ʽ?α???
	public BufferReader readPureBlockData(int recordCount) throws IOException {
		return new BufferReader(storage.getStructManager(), readDataBlock());
	}
	
	//????ʽ?α???
	public BufferReader readPureBlockData(long pos, int recordCount) throws IOException {
		return new BufferReader(storage.getStructManager(), readDataBlock(pos));
	}
	
	//????ʽ?α???
	private BufferReader getBufferReader(byte[] buffer, int recordCount) {
		if (isPureStorage) {
			if (PureBufferReader.canUseBufferReader(buffer, 0)) {
				BufferReader reader = new BufferReader(storage.getStructManager(), buffer);
				reader.index++;
				return reader;
			} else {
				return new PureBufferReader(storage.getStructManager(), buffer, recordCount, dict);
			}
		} else {
			return new BufferReader(storage.getStructManager(), buffer);
		}
	}
	
	//??ѹ????ȡ
	public RowBufferReader readBlockBuffer() throws IOException {
		int count = readInt32();
		byte []buffer = new byte[count];
		readFully(buffer, 0, count);
		return new RowBufferReader(storage.getStructManager(), buffer);
	}
	
	public BufferReader readBlockBuffer(long pos) throws IOException {
		seek(pos);
		int count = readInt32();
		byte []buffer = new byte[count];
		readFully(buffer, 0, count);
		return new BufferReader(storage.getStructManager(), buffer);
	}
	
	public long position() {
		return currentBlockPos;
	}
	
	public int getCaret() {
		return caret;
	}
	
	public IBlockStorage getStorage() {
		return storage;
	}
	
	public Sequence getDict() {
		return dict;
	}

	public void setDict(Sequence dict) {
		this.dict = dict;
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy