All Downloads are FREE. Search and download functionalities are using the official Maven repository.

play.data.parsing.MultipartStream Maven / Gradle / Ivy

There is a newer version: 2.6.2
Show newest version
package play.data.parsing;

import java.io.ByteArrayOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.nio.charset.Charset;
import org.apache.commons.fileupload.FileItemStream;
import org.apache.commons.fileupload.ProgressListener;
import org.apache.commons.fileupload.util.Closeable;
import org.apache.commons.fileupload.util.Streams;

/**
 * Low level API for processing file uploads.
 *
 * 

This class can be used to process data streams conforming to MIME 'multipart' format as * defined in RFC 1867. Arbitrarily large amounts * of data in the stream can be processed under constant memory usage. * *

The format of the stream is defined in the following way:
* * multipart-body := preamble 1*encapsulation close-delimiter epilogue
* encapsulation := delimiter body CRLF
* delimiter := "--" boundary CRLF
* close-delimiter := "--" boundary "--"
* preamble := <ignore>
* epilogue := <ignore>
* body := header-part CRLF body-part
* header-part := 1*header CRLF
* header := header-name ":" header-value
* header-name := <printable ascii characters except ":">
* header-value := <any ascii characters except CR & LF>
* body-data := <arbitrary data>
*
* *

Note that body-data can contain another multipart entity. There is limited support for single * pass processing of such nested streams. The nested stream is required to have a * boundary token of the same length as the parent stream (see {@link #setBoundary(byte[])}). * *

Here is an example of usage of this class.
* *

 *    try {
 *        MultipartStream multipartStream = new MultipartStream(input,
 *                                                              boundary);
 *        boolean nextPart = multipartStream.skipPreamble();
 *        OutputStream output;
 *        while(nextPart) {
 *            header = chunks.readHeader();
 *            // process headers
 *            // create some output stream
 *            multipartStream.readBodyPart(output);
 *            nextPart = multipartStream.readBoundary();
 *        }
 *    } catch(MultipartStream.MalformedStreamException e) {
 *          // the stream failed to follow required syntax
 *    } catch(IOException) {
 *          // a read or write error occurred
 *    }
 *
 * 
* * @author Rafal Krzewski * @author Martin Cooper * @author Sean C. Sullivan * @version $Id: MultipartStream.java 174 2007-11-04 21:25:00Z leo $ */ public class MultipartStream { /** Internal class, which is used to invoke the {@link ProgressListener}. */ static class ProgressNotifier { /** The listener to invoke. */ private final ProgressListener listener; /** Number of expected bytes, if known, or -1. */ private final long contentLength; /** Number of bytes, which have been read so far. */ private long bytesRead; /** Number of items, which have been read so far. */ private int items; /** * Creates a new instance with the given listener and content length. * * @param pListener The listener to invoke. * @param pContentLength The expected content length. */ ProgressNotifier(ProgressListener pListener, long pContentLength) { listener = pListener; contentLength = pContentLength; } /** * Called to indicate that bytes have been read. * * @param pBytes Number of bytes, which have been read. */ void noteBytesRead(int pBytes) { /* Indicates, that the given number of bytes have been read from * the input stream. */ bytesRead += pBytes; notifyListener(); } /** Called to indicate, that a new file item has been detected. */ void noteItem() { ++items; } /** Called for notifying the listener. */ private void notifyListener() { if (listener != null) { listener.update(bytesRead, contentLength, items); } } } // ----------------------------------------------------- Manifest constants /** The Carriage Return ASCII character value. */ public static final byte CR = 0x0D; /** The Line Feed ASCII character value. */ public static final byte LF = 0x0A; /** The dash (-) ASCII character value. */ public static final byte DASH = 0x2D; /** * The maximum length of header-part that will be processed (10 kilobytes = 10240 * bytes.). */ public static final int HEADER_PART_SIZE_MAX = 10240; /** The default length of the buffer used for processing a request. */ protected static final int DEFAULT_BUFSIZE = 4096; /** A byte sequence that marks the end of header-part (CRLFCRLF). */ protected static final byte[] HEADER_SEPARATOR = {CR, LF, CR, LF}; /** * A byte sequence that that follows a delimiter that will be followed by an encapsulation ( * CRLF). */ protected static final byte[] FIELD_SEPARATOR = {CR, LF}; /** * A byte sequence that that follows a delimiter of the last encapsulation in the stream (-- * ). */ protected static final byte[] STREAM_TERMINATOR = {DASH, DASH}; /** A byte sequence that precedes a boundary (CRLF--). */ protected static final byte[] BOUNDARY_PREFIX = {CR, LF, DASH, DASH}; /** The number of bytes, over and above the boundary size, to use for the keep region. */ private static final int KEEP_REGION_PAD = 3; // ----------------------------------------------------------- Data members /** The input stream from which data is read. */ private final InputStream input; /** The length of the boundary token plus the leading CRLF--. */ private int boundaryLength; /** * The amount of data, in bytes, that must be kept in the buffer in order to detect delimiters * reliably. */ private final int keepRegion; /** The byte sequence that partitions the stream. */ private final byte[] boundary; /** The length of the buffer used for processing the request. */ private final int bufSize; /** The buffer used for processing the request. */ private final byte[] buffer; /** * The index of first valid character in the buffer.
* 0 <= head < bufSize */ private int head; /** * The index of last valid character in the buffer + 1.
* 0 <= tail <= bufSize */ private int tail; /** The content encoding to use when reading headers. */ private Charset headerEncoding; /** The progress notifier, if any, or null. */ private final ProgressNotifier notifier; /** * Constructs a MultipartStream with a custom size buffer. * *

Note that the buffer must be at least big enough to contain the boundary string, plus 4 * characters for CR/LF and double dash, plus at least one byte of data. Too small a buffer size * setting will degrade performance. * * @param input The InputStream to serve as a data source. * @param boundary The token used for dividing the stream into encapsulations. * @param bufSize The size of the buffer to be used, in bytes. * @param pNotifier The notifier, which is used for calling the progress listener, if any. * @see #MultipartStream(InputStream, byte[], ProgressNotifier) */ MultipartStream(InputStream input, byte[] boundary, int bufSize, ProgressNotifier pNotifier) { this.input = input; this.bufSize = bufSize; this.buffer = new byte[bufSize]; this.notifier = pNotifier; // We prepend CR/LF to the boundary to chop trailing CR/LF from // body-data tokens. this.boundary = new byte[boundary.length + BOUNDARY_PREFIX.length]; this.boundaryLength = boundary.length + BOUNDARY_PREFIX.length; this.keepRegion = boundary.length + KEEP_REGION_PAD; System.arraycopy(BOUNDARY_PREFIX, 0, this.boundary, 0, BOUNDARY_PREFIX.length); System.arraycopy(boundary, 0, this.boundary, BOUNDARY_PREFIX.length, boundary.length); head = 0; tail = 0; } /** * Constructs a MultipartStream with a default size buffer. * * @param input The InputStream to serve as a data source. * @param boundary The token used for dividing the stream into encapsulations. * @param pNotifier An object for calling the progress listener, if any. * @see #MultipartStream(InputStream, byte[], int, ProgressNotifier) */ MultipartStream(InputStream input, byte[] boundary, ProgressNotifier pNotifier) { this(input, boundary, DEFAULT_BUFSIZE, pNotifier); } /** * Retrieves the character encoding used when reading the headers of an individual part. When not * specified, or null, the platform default encoding is used. * * @return The encoding used to read part headers. */ public Charset getHeaderEncoding() { return headerEncoding; } /** * Specifies the character encoding to be used when reading the headers of individual parts. When * not specified, or null, the platform default encoding is used. * * @param encoding The encoding used to read part headers. */ public void setHeaderEncoding(Charset encoding) { headerEncoding = encoding; } /** * Reads a byte from the buffer, and refills it as necessary. * * @return The next byte from the input stream. * @throws IOException if there is no more data available. */ public byte readByte() throws IOException { // Buffer depleted ? if (head == tail) { head = 0; // Refill. tail = input.read(buffer, head, bufSize); if (tail == -1) { // No more data available. throw new IOException("No more data is available"); } if (notifier != null) { notifier.noteBytesRead(tail); } } return buffer[head++]; } /** * Skips a boundary token, and checks whether more encapsulations are * contained in the stream. * * @return true if there are more encapsulations in this stream; false * otherwise. * @throws MalformedStreamException if the stream ends unexpectedly or fails to follow required * syntax. */ public boolean readBoundary() throws MalformedStreamException { byte[] marker = new byte[2]; boolean nextChunk; head += boundaryLength; try { marker[0] = readByte(); if (marker[0] == LF) { // Work around IE5 Mac bug with input type=image. // Because the boundary delimiter, not including the trailing // CRLF, must not appear within any file (RFC 2046, section // 5.1.1), we know the missing CR is due to a buggy browser // rather than a file containing something similar to a // boundary. return true; } marker[1] = readByte(); if (arraysEqual(marker, STREAM_TERMINATOR, 2)) { nextChunk = false; } else if (arraysEqual(marker, FIELD_SEPARATOR, 2)) { nextChunk = true; } else { throw new MalformedStreamException("Unexpected characters follow a boundary"); } } catch (IOException e) { throw new MalformedStreamException("Stream ended unexpectedly", e); } return nextChunk; } /** * Changes the boundary token used for partitioning the stream. * *

This method allows single pass processing of nested multipart streams. * *

The boundary token of the nested stream is required to be of the same length as * the boundary token in parent stream. * *

Restoring the parent stream boundary token after processing of a nested stream is left to * the application. * * @param boundary The boundary to be used for parsing of the nested stream. * @throws IllegalBoundaryException if the boundary has a different length than the * one being currently parsed. */ public void setBoundary(byte[] boundary) throws IllegalBoundaryException { if (boundary.length != boundaryLength - BOUNDARY_PREFIX.length) { throw new IllegalBoundaryException("The length of a boundary token can not be changed"); } System.arraycopy(boundary, 0, this.boundary, BOUNDARY_PREFIX.length, boundary.length); } /** * Reads the header-part of the current encapsulation. * *

Headers are returned verbatim to the input stream, including the trailing CRLF * marker. Parsing is left to the application. * *

TODO allow limiting maximum header size to protect against abuse. * * @return The header-part of the current encapsulation. * @throws MalformedStreamException if the stream ends unexpectedly. */ public String readHeaders() throws MalformedStreamException { int i = 0; byte[] b = new byte[1]; // to support multi-byte characters ByteArrayOutputStream baos = new ByteArrayOutputStream(); int sizeMax = HEADER_PART_SIZE_MAX; int size = 0; while (i < HEADER_SEPARATOR.length) { try { b[0] = readByte(); } catch (IOException e) { throw new MalformedStreamException("Stream ended unexpectedly", e); } size++; if (b[0] == HEADER_SEPARATOR[i]) { i++; } else { i = 0; } if (size <= sizeMax) { baos.write(b[0]); } } String headers = null; if (headerEncoding != null) { headers = baos.toString(headerEncoding); } else { headers = baos.toString(); } return headers; } /** * Reads body-data from the current encapsulation and writes its * contents into the output Stream. * *

Arbitrary large amounts of data can be processed by this method using a constant size * buffer. (see {@link #MultipartStream(InputStream,byte[],int, ProgressNotifier) constructor}). * * @param output The Stream to write data into. May be null, in which case this * method is equivalent to {@link #discardBodyData()}. * @return the amount of data written. * @throws MalformedStreamException if the stream ends unexpectedly. * @throws IOException if an i/o error occurs. */ public int readBodyData(OutputStream output) throws MalformedStreamException, IOException { InputStream istream = newInputStream(); return (int) Streams.copy(istream, output, false); } /** * Creates a new {@link ItemInputStream}. * * @return A new instance of {@link ItemInputStream}. */ ItemInputStream newInputStream() { return new ItemInputStream(); } /** * Reads body-data from the current encapsulation and discards it. * *

Use this method to skip encapsulations you don't need or don't understand. * * @return The amount of data discarded. * @throws MalformedStreamException if the stream ends unexpectedly. * @throws IOException if an i/o error occurs. */ public int discardBodyData() throws MalformedStreamException, IOException { return readBodyData(null); } /** * Finds the beginning of the first encapsulation. * * @return true if an encapsulation was found in the stream. * @throws IOException if an i/o error occurs. */ public boolean skipPreamble() throws IOException { // First delimiter may be not preceded with a CRLF. System.arraycopy(boundary, 2, boundary, 0, boundary.length - 2); boundaryLength = boundary.length - 2; try { // Discard all data up to the delimiter. discardBodyData(); // Read boundary - if succeded, the stream contains an // encapsulation. return readBoundary(); } catch (MalformedStreamException e) { return false; } finally { // Restore delimiter. System.arraycopy(boundary, 0, boundary, 2, boundary.length - 2); boundaryLength = boundary.length; boundary[0] = CR; boundary[1] = LF; } } /** * Compares count first bytes in the arrays a and b. * * @param a The first array to compare. * @param b The second array to compare. * @param count How many bytes should be compared. * @return true if count first bytes in arrays a and * b are equal. */ private static boolean arraysEqual(byte[] a, byte[] b, int count) { for (int i = 0; i < count; i++) { if (a[i] != b[i]) { return false; } } return true; } /** * Searches for a byte of specified value in the buffer, starting at the specified * position. * * @param value The value to find. * @param pos The starting position for searching. * @return The position of byte found, counting from beginning of the buffer, or * -1 if not found. */ protected int findByte(byte value, int pos) { for (int i = pos; i < tail; i++) { if (buffer[i] == value) { return i; } } return -1; } /** * Searches for the boundary in the buffer region delimited by * head and tail. * * @return The position of the boundary found, counting from the beginning of the buffer * , or -1 if not found. */ protected int findSeparator() { int first; int match = 0; int maxPos = tail - boundaryLength; for (first = head; (first <= maxPos) && (match != boundaryLength); first++) { first = findByte(boundary[0], first); if (first == -1 || (first > maxPos)) { return -1; } for (match = 1; match < boundaryLength; match++) { if (buffer[first + match] != boundary[match]) { break; } } } if (match == boundaryLength) { return first - 1; } return -1; } /** Thrown to indicate that the input stream fails to follow the required syntax. */ public static class MalformedStreamException extends IOException { /** Constructs a MalformedStreamException with no detail message. */ public MalformedStreamException() { super(); } /** * Constructs an MalformedStreamException with the specified detail message. * * @param message The detail message. */ public MalformedStreamException(String message) { super(message); } public MalformedStreamException(String message, Throwable cause) { super(message, cause); } } /** Thrown upon attempt of setting an invalid boundary token. */ public static class IllegalBoundaryException extends IOException { /** Constructs an IllegalBoundaryException with no detail message. */ public IllegalBoundaryException() { super(); } /** * Constructs an IllegalBoundaryException with the specified detail message. * * @param message The detail message. */ public IllegalBoundaryException(String message) { super(message); } } /** An {@link InputStream} for reading an items contents. */ public class ItemInputStream extends InputStream implements Closeable { /** The number of bytes, which have been read so far. */ private long total; /** The number of bytes, which must be hold, because they might be a part of the boundary. */ private int pad; /** The current offset in the buffer. */ private int pos; /** Whether the stream is already closed. */ private boolean closed; /** Creates a new instance. */ ItemInputStream() { findSeparator(); } /** Called for finding the separator. */ private void findSeparator() { pos = MultipartStream.this.findSeparator(); if (pos == -1) { pad = Math.min(tail - head, keepRegion); } } /** * Returns the number of bytes, which have been read by the stream. * * @return Number of bytes, which have been read so far. */ public long getBytesRead() { return total; } /** * Returns the number of bytes, which are currently available, without blocking. * * @return Number of bytes in the buffer. */ @Override public int available() { if (pos == -1) { return tail - head - pad; } return pos - head; } /** Offset when converting negative bytes to integers. */ private static final int BYTE_POSITIVE_OFFSET = 256; /** * Returns the next byte in the stream. * * @return The next byte in the stream, as a non-negative integer, or -1 for EOF. * @throws IOException An I/O error occurred. */ @Override public int read() throws IOException { if (closed) { throw new FileItemStream.ItemSkippedException(); } if (available() == 0) { if (makeAvailable() == 0) { return -1; } } ++total; int b = buffer[head++]; if (b >= 0) { return b; } return b + BYTE_POSITIVE_OFFSET; } /** * Reads bytes into the given buffer. * * @param b The destination buffer, where to write to. * @param off Offset of the first byte in the buffer. * @param len Maximum number of bytes to read. * @return Number of bytes, which have been actually read, or -1 for EOF. * @throws IOException An I/O error occurred. */ @Override public int read(byte[] b, int off, int len) throws IOException { if (closed) { throw new FileItemStream.ItemSkippedException(); } if (len == 0) { return 0; } int res = available(); if (res == 0) { res = makeAvailable(); if (res == 0) { return -1; } } res = Math.min(res, len); System.arraycopy(buffer, head, b, off, res); head += res; total += res; return res; } /** * Closes the input stream. * * @throws IOException An I/O error occurred. */ @Override public void close() throws IOException { if (closed) { return; } for (; ; ) { int av = available(); if (av == 0) { av = makeAvailable(); if (av == 0) { break; } } skip(av); } closed = true; } /** * Skips the given number of bytes. * * @param bytes Number of bytes to skip. * @return The number of bytes, which have actually been skipped. * @throws IOException An I/O error occurred. */ @Override public long skip(long bytes) throws IOException { if (closed) { throw new FileItemStream.ItemSkippedException(); } int av = available(); if (av == 0) { av = makeAvailable(); if (av == 0) { return 0; } } long res = Math.min(av, bytes); head += res; return res; } /** * Attempts to read more data. * * @return Number of available bytes * @throws IOException An I/O error occurred. */ private int makeAvailable() throws IOException { if (pos != -1) { return 0; } // Move the data to the beginning of the buffer. total += tail - head - pad; System.arraycopy(buffer, tail - pad, buffer, 0, pad); // Refill buffer with new data. head = 0; int bytesRead = input.read(buffer, pad, bufSize - pad); if (bytesRead == -1) { // The last pad amount is left in the buffer. // Boundary can't be in there so signal an error // condition. throw new MalformedStreamException("Stream ended unexpectedly"); } // notifier.noteBytesRead(bytesRead); tail = pad + bytesRead; findSeparator(); return available(); } /** * Returns, whether the stream is closed. * * @return True, if the stream is closed, otherwise false. */ @Override public boolean isClosed() { return closed; } } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy