All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.kafka.common.utils.ChunkedBytesStream Maven / Gradle / Ivy

There is a newer version: 3.9.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.kafka.common.utils;

import java.io.BufferedInputStream;
import java.io.FilterInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.nio.ByteBuffer;

/**
 * ChunkedBytesStream is a copy of {@link BufferedInputStream} with the following differences:
 * - Unlike {@link java.io.BufferedInputStream#skip(long)} this class could be configured to not push skip() to
 * input stream. We may want to avoid pushing this to input stream because it's implementation maybe inefficient,
 * e.g. the case of ZstdInputStream which allocates a new buffer from buffer pool, per skip call.
 * - Unlike {@link java.io.BufferedInputStream}, which allocates an intermediate buffer, this uses a buffer supplier to
 * create the intermediate buffer.
 * - Unlike {@link java.io.BufferedInputStream}, this implementation does not support {@link InputStream#mark(int)} and
 * {@link InputStream#markSupported()} will return false.
 * 

* Note that: * - this class is not thread safe and shouldn't be used in scenarios where multiple threads access this. * - the implementation of this class is performance sensitive. Minor changes such as usage of ByteBuffer instead of byte[] * can significantly impact performance, hence, proceed with caution. */ public class ChunkedBytesStream extends FilterInputStream { /** * Supplies the ByteBuffer which is used as intermediate buffer to store the chunk of output data. */ private final BufferSupplier bufferSupplier; /** * Intermediate buffer to store the chunk of output data. The ChunkedBytesStream is considered closed if * this buffer is null. */ private byte[] intermediateBuf; /** * The index one greater than the index of the last valid byte in * the buffer. * This value is always in the range 0 through intermediateBuf.length; * elements intermediateBuf[0] through intermediateBuf[count-1] * contain buffered input data obtained * from the underlying input stream. */ protected int count = 0; /** * The current position in the buffer. This is the index of the next * character to be read from the buf array. *

* This value is always in the range 0 * through count. If it is less * than count, then intermediateBuf[pos] * is the next byte to be supplied as input; * if it is equal to count, then * the next read or skip * operation will require more bytes to be * read from the contained input stream. */ protected int pos = 0; /** * Reference for the intermediate buffer. This reference is only kept for releasing the buffer from the * buffer supplier. */ private final ByteBuffer intermediateBufRef; /** * If this flag is true, we will delegate the responsibility of skipping to the * sourceStream. This is an alternative to reading the data from source stream, storing in an intermediate buffer and * skipping the values using this implementation. */ private final boolean delegateSkipToSourceStream; public ChunkedBytesStream(InputStream in, BufferSupplier bufferSupplier, int intermediateBufSize, boolean delegateSkipToSourceStream) { super(in); this.bufferSupplier = bufferSupplier; intermediateBufRef = bufferSupplier.get(intermediateBufSize); if (!intermediateBufRef.hasArray() || (intermediateBufRef.arrayOffset() != 0)) { throw new IllegalArgumentException("provided ByteBuffer lacks array or has non-zero arrayOffset"); } intermediateBuf = intermediateBufRef.array(); this.delegateSkipToSourceStream = delegateSkipToSourceStream; } /** * Check to make sure that buffer has not been nulled out due to * close; if not return it; */ private byte[] getBufIfOpen() throws IOException { byte[] buffer = intermediateBuf; if (buffer == null) throw new IOException("Stream closed"); return buffer; } /** * See the general contract of the read * method of InputStream. * * @return the next byte of data, or -1 if the end of the * stream is reached. * @throws IOException if this input stream has been closed by * invoking its {@link #close()} method, * or an I/O error occurs. * @see BufferedInputStream#read() */ @Override public int read() throws IOException { if (pos >= count) { fill(); if (pos >= count) return -1; } return getBufIfOpen()[pos++] & 0xff; } /** * Check to make sure that underlying input stream has not been * nulled out due to close; if not return it; */ InputStream getInIfOpen() throws IOException { InputStream input = in; if (input == null) throw new IOException("Stream closed"); return input; } /** * Fills the intermediate buffer with more data. The amount of new data read is equal to the remaining empty space * in the buffer. For optimal performance, read as much data as possible in this call. * This method also assumes that all data has already been read in, hence pos > count. */ int fill() throws IOException { byte[] buffer = getBufIfOpen(); pos = 0; count = pos; int n = getInIfOpen().read(buffer, pos, buffer.length - pos); if (n > 0) count = n + pos; return n; } @Override public void close() throws IOException { byte[] mybuf = intermediateBuf; intermediateBuf = null; InputStream input = in; in = null; if (mybuf != null) bufferSupplier.release(intermediateBufRef); if (input != null) input.close(); } /** * Reads bytes from this byte-input stream into the specified byte array, * starting at the given offset. * *

This method implements the general contract of the corresponding * {@link InputStream#read(byte[], int, int) read} method of * the {@link InputStream} class. As an additional * convenience, it attempts to read as many bytes as possible by repeatedly * invoking the read method of the underlying stream. This * iterated read continues until one of the following * conditions becomes true:

    * *
  • The specified number of bytes have been read, * *
  • The read method of the underlying stream returns * -1, indicating end-of-file, or * *
  • The available method of the underlying stream * returns zero, indicating that further input requests would block. * *
If the first read on the underlying stream returns * -1 to indicate end-of-file then this method returns * -1. Otherwise this method returns the number of bytes * actually read. * *

Subclasses of this class are encouraged, but not required, to * attempt to read as many bytes as possible in the same fashion. * * @param b destination buffer. * @param off offset at which to start storing bytes. * @param len maximum number of bytes to read. * @return the number of bytes read, or -1 if the end of * the stream has been reached. * @throws IOException if this input stream has been closed by * invoking its {@link #close()} method, * or an I/O error occurs. * @see BufferedInputStream#read(byte[], int, int) */ public int read(byte[] b, int off, int len) throws IOException { getBufIfOpen(); // Check for closed stream if ((off | len | (off + len) | (b.length - (off + len))) < 0) { throw new IndexOutOfBoundsException(); } else if (len == 0) { return 0; } int n = 0; for (; ; ) { int nread = read1(b, off + n, len - n); if (nread <= 0) return (n == 0) ? nread : n; n += nread; if (n >= len) return n; // if not closed but no bytes available, return InputStream input = in; if (input != null && input.available() <= 0) return n; } } /** * Read characters into a portion of an array, reading from the underlying * stream at most once if necessary. *

* Note - Implementation copied from {@link BufferedInputStream}. Slight modification done to remove * the mark position. */ private int read1(byte[] b, int off, int len) throws IOException { int avail = count - pos; if (avail <= 0) { /* If the requested length is at least as large as the buffer, and if there is no mark/reset activity, do not bother to copy the bytes into the local buffer. In this way buffered streams will cascade harmlessly. */ if (len >= getBufIfOpen().length) { return getInIfOpen().read(b, off, len); } fill(); avail = count - pos; if (avail <= 0) return -1; } int cnt = (avail < len) ? avail : len; System.arraycopy(getBufIfOpen(), pos, b, off, cnt); pos += cnt; return cnt; } /** * Skips over and discards exactly {@code n} bytes of data from this input stream. * If {@code n} is zero, then no bytes are skipped. * If {@code n} is negative, then no bytes are skipped. *

* This method blocks until the requested number of bytes has been skipped, end of file is reached, or an * exception is thrown. *

If end of stream is reached before the stream is at the desired position, then the bytes skipped till than pointed * are returned. *

If an I/O error occurs, then the input stream may be in an inconsistent state. It is strongly recommended that the * stream be promptly closed if an I/O error occurs. *

* This method first skips and discards bytes in the intermediate buffer. * After that, depending on the value of {@link #delegateSkipToSourceStream}, it either delegates the skipping of * bytes to the sourceStream or it reads the data from input stream in chunks, copies the data into intermediate * buffer and skips it. *

* Starting JDK 12, a new method was introduced in InputStream, skipNBytes which has a similar behaviour as * this method. * * @param toSkip the number of bytes to be skipped. * @return the actual number of bytes skipped which might be zero. * @throws IOException if this input stream has been closed by invoking its {@link #close()} method, * {@code in.skip(n)} throws an IOException, or an I/O error occurs. */ @Override public long skip(long toSkip) throws IOException { getBufIfOpen(); // Check for closed stream if (toSkip <= 0) { return 0; } long remaining = toSkip; // Skip bytes stored in intermediate buffer first int avail = count - pos; int bytesSkipped = (int) Math.min(avail, remaining); pos += bytesSkipped; remaining -= bytesSkipped; while (remaining > 0) { if (delegateSkipToSourceStream) { // Use sourceStream's skip() to skip the rest. // conversion to int is acceptable because toSkip and remaining are int. long delegateBytesSkipped = getInIfOpen().skip(remaining); if (delegateBytesSkipped == 0) { // read one byte to check for EOS if (read() == -1) { break; } // one byte read so decrement number to skip remaining--; } else if (delegateBytesSkipped > remaining || delegateBytesSkipped < 0) { // skipped negative or too many bytes throw new IOException("Unable to skip exactly"); } remaining -= delegateBytesSkipped; } else { // skip from intermediate buffer, filling it first (if required) if (pos >= count) { fill(); // if we don't have data in intermediate buffer after fill, then stop skipping if (pos >= count) break; } avail = count - pos; bytesSkipped = (int) Math.min(avail, remaining); pos += bytesSkipped; remaining -= bytesSkipped; } } return toSkip - remaining; } // visible for testing public InputStream sourceStream() { return in; } /** * Returns an estimate of the number of bytes that can be read (or * skipped over) from this input stream without blocking by the next * invocation of a method for this input stream. The next invocation might be * the same thread or another thread. A single read or skip of this * many bytes will not block, but may read or skip fewer bytes. *

* This method returns the sum of the number of bytes remaining to be read in * the buffer (count - pos) and the result of calling the * {@link java.io.FilterInputStream#in in}.available(). * * @return an estimate of the number of bytes that can be read (or skipped * over) from this input stream without blocking. * @throws IOException if this input stream has been closed by * invoking its {@link #close()} method, * or an I/O error occurs. * @see BufferedInputStream#available() */ @Override public synchronized int available() throws IOException { int n = count - pos; int avail = getInIfOpen().available(); return n > (Integer.MAX_VALUE - avail) ? Integer.MAX_VALUE : n + avail; } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy