com.cybermkd.upload.multipart.MultipartParser Maven / Gradle / Ivy

Go to download

Show more of this group Show more artifacts with this name
Show all versions of ICEREST Show documentation

一个极简的restful框架

There is a newer version: 1.0.1.3

package com.cybermkd.upload.multipart;

import com.cybermkd.common.http.ContentType;
import com.cybermkd.common.http.HttpRequest;
import com.cybermkd.common.http.exception.WebException;

import java.io.ByteArrayOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.Enumeration;
import java.util.Vector;


/**
 * A utility class to handle multipart/form-data requests,
 * the kind of requests that support file uploads.  This class uses a
 * "pull" model where the reading of incoming files and params is
 * controlled by the client code, which allows incoming files to be stored
 * into any OutputStream.  If you wish to use an API which
 * resembles HttpRequest, use the "push" model
 * MultipartRequest instead.  It's an easy-to-use wrapper
 * around this class.
 *
 * This class can receive arbitrarily large files (up to an artificial limit
 * you can set), and fairly efficiently too.
 * It cannot handle nested data (multipart content within multipart content).
 * It can handle internationalized content (such as non Latin-1 filenames).
 *
 * It also optionally includes enhanced buffering and Content-Length
 * limitation.  Buffering is only required if your servlet container is
 * poorly implemented (many are, including Tomcat 3.2),
 * but it is generally recommended because it will make a slow servlet
 * container a lot faster, and will only make a fast servlet container a
 * little slower.  Content-Length limiting is usually only required if you find
 * that your servlet is hanging trying to read the input stream from the POST,
 * and it is similarly recommended because it only has a minimal impact on
 * performance.
 *
 * See the included upload.war for an example of how to use this class.
 *
 * The full file upload specification is contained in experimental RFC 1867,
 * available at
 * http://www.ietf.org/rfc/rfc1867.txt.
 *
 * @author Jason Hunter
 * @author Geoff Soutter
 * @version 1.0, 2000/10/27, initial revision
 * @see com.cybermkd.upload.MultipartRequest
 */
public class MultipartParser {

    /**
     * Encoding used when the caller does not supply one.
     */
    private static final String DEFAULT_ENCODING = "ISO-8859-1";
    /**
     * Length of the "content-type:" header prefix (13 characters).
     */
    private static final int CONTENT_TYPE_PREFIX_LENGTH = "content-type:".length();
    /**
     * Header prefix that introduces a part's disposition.
     */
    private static final String DISPOSITION_PREFIX = "content-disposition:";
    /**
     * Input stream to read parts from.
     */
    private final ServletInputStream in;
    /**
     * MIME boundary that delimits parts, including the leading "--".
     */
    private final String boundary;
    /**
     * Reference to the last file part we returned, so that its remaining
     * content can be skipped before the next part is read.
     */
    private FilePart lastFilePart;
    /**
     * Scratch buffer for the readLine method.
     */
    private final byte[] buf = new byte[8 * 1024];
    /**
     * Encoding used to decode header lines and parameter values.
     */
    private String encoding = DEFAULT_ENCODING;

    /**
     * Creates a MultipartParser from the specified request,
     * which limits the upload size to the specified length, buffers for
     * performance and prevents attempts to read past the amount specified
     * by the Content-Length.
     *
     * @param req     the request to parse.
     * @param maxSize the maximum size of the POST content.
     * @throws IOException if the boundary is missing or the body ends prematurely.
     */
    public MultipartParser(HttpRequest req,
                           int maxSize) throws IOException {
        this(req, maxSize, true, true);
    }

    /**
     * Creates a MultipartParser from the specified request,
     * which limits the upload size to the specified length, and optionally
     * buffers for performance and prevents attempts to read past the amount
     * specified by the Content-Length.
     *
     * @param req         the request to parse.
     * @param maxSize     the maximum size of the POST content.
     * @param buffer      whether to do internal buffering or let the server buffer,
     *                    useful for servers that don't buffer
     * @param limitLength boolean flag to indicate if we need to filter
     *                    the request's input stream to prevent trying to
     *                    read past the end of the stream.
     * @throws IOException if the boundary is missing or the body ends prematurely.
     */
    public MultipartParser(HttpRequest req, int maxSize, boolean buffer,
                           boolean limitLength) throws IOException {
        this(req, maxSize, buffer, limitLength, null);
    }

    /**
     * Creates a MultipartParser from the specified request,
     * which limits the upload size to the specified length, and optionally
     * buffers for performance and prevents attempts to read past the amount
     * specified by the Content-Length, and with a specified encoding.
     *
     * On return the stream is positioned just after the first boundary line,
     * ready for {@link #readNextPart()}.
     *
     * @param req         the request to parse.
     * @param maxSize     the maximum size of the POST content.
     * @param buffer      whether to do internal buffering or let the server buffer,
     *                    useful for servers that don't buffer
     * @param limitLength boolean flag to indicate if we need to filter
     *                    the request's input stream to prevent trying to
     *                    read past the end of the stream.
     * @param encoding    the encoding to use for parsing, default is ISO-8859-1.
     * @throws WebException if the content type is not multipart or the declared
     *                      content length exceeds maxSize.
     * @throws IOException  if no boundary is specified or the body ends before
     *                      the first boundary is found.
     */
    public MultipartParser(HttpRequest req, int maxSize, boolean buffer,
                           boolean limitLength, String encoding)
            throws IOException {
        // The encoding must be known before the very first line is read.
        // Assigned directly rather than through the overridable setter, which
        // would otherwise run on a partially constructed object.
        if (encoding != null) {
            this.encoding = encoding;
        }

        // Check the content type to make sure it's "multipart/form-data".
        // The header is read two ways to work around WebSphere oddities.
        String type = chooseContentType(req.getHeader("Content-Type"), req.getContentType());
        if (type == null || !toAsciiLowerCase(type).startsWith(ContentType.MULTIPART.value())) {
            throw new WebException("Posted content type isn't '" + ContentType.MULTIPART.value() + "'.");
        }

        // Check the content length to prevent denial of service attacks
        int length = req.getContentLength();
        if (length > maxSize) {
            throw new WebException("Posted content length of " + length +
                    " exceeds limit of " + maxSize + ".");
        }

        // Get the boundary string; it's included in the content type.
        // Should look something like "------------------------12012133613061"
        String parsedBoundary = extractBoundary(type);
        if (parsedBoundary == null) {
            throw new IOException("File separation boundary was not specified.");
        }

        // Wrap the real input stream with classes that "enhance" its behaviour
        // for performance and stability.  The wrappers are chained (the limiter
        // goes around the buffer) so that asking for both yields both.
        InputStream content = req.getContentStream();
        ServletInputStream stream = null;
        if (buffer) {
            stream = new BufferedServletInputStream(content);
            content = stream;
        }
        if (limitLength) {
            stream = new LimitedServletInputStream(content, length);
        }
        if (stream == null) {
            // readLine() needs a ServletInputStream; with both options off the
            // buffered wrapper serves as the adapter instead of leaving the
            // stream unset.
            stream = new BufferedServletInputStream(content);
        }
        this.in = stream;
        this.boundary = parsedBoundary;

        // Read until we hit the boundary.
        // Some clients send a preamble (per RFC 2046), so ignore that.
        String line;
        do {
            line = readLine();
            if (line == null) {
                throw new IOException("Corrupt form data: premature ending");
            }
        } while (!line.startsWith(this.boundary));
    }

    /**
     * Picks the content type to trust when it is available from two sources.
     *
     * @param fromHeader  value of the raw "Content-Type" header, may be null.
     * @param fromRequest value reported by the request object, may be null.
     * @return the non-null value if only one is present, the longer value if
     * both are present (the first wins a tie only when strictly longer), or
     * null if neither is present.
     */
    private static String chooseContentType(String fromHeader, String fromRequest) {
        if (fromHeader == null) {
            return fromRequest;
        }
        if (fromRequest == null) {
            return fromHeader;
        }
        return fromHeader.length() > fromRequest.length() ? fromHeader : fromRequest;
    }

    /**
     * Lowercases the ASCII letters A-Z only.  Unlike String.toLowerCase()
     * the result never depends on the default locale and always has the same
     * length as the input, so indexes found in the result are valid in the
     * original string as well.
     *
     * @param text the text to convert.
     * @return the text with A-Z replaced by a-z.
     */
    private static String toAsciiLowerCase(String text) {
        char[] chars = text.toCharArray();
        for (int i = 0; i < chars.length; i++) {
            char c = chars[i];
            if (c >= 'A' && c <= 'Z') {
                chars[i] = (char) (c + ('a' - 'A'));
            }
        }
        return new String(chars);
    }

    /**
     * Extracts the media type from a "Content-Type:" header line.
     * The caller must have verified that the line starts with that prefix.
     *
     * @param line the complete header line.
     * @return the lowercased media type without parameters; empty if the
     * header carries no value.
     */
    private static String extractContentType(String line) {
        String lower = toAsciiLowerCase(line);

        // Opera at least puts extra info after the type, for example:
        //   Content-Type: text/plain; name="foo"
        // so stop at the first semicolon.
        int end = lower.indexOf(';');
        if (end == -1) {
            end = lower.length();
        }

        return lower.substring(CONTENT_TYPE_PREFIX_LENGTH, end).trim();
    }

    /**
     * Sets the encoding used to parse from here onward.  The default is
     * ISO-8859-1.  Encodings are actually best passed into the constructor,
     * so even the initial line reads are correct.
     *
     * @param encoding The encoding to use for parsing
     */
    public void setEncoding(String encoding) {
        this.encoding = encoding;
    }

    /**
     * Read the next part arriving in the stream. Will be either a
     * FilePart or a ParamPart, or null
     * to indicate there are no more parts to read. The order of arrival
     * corresponds to the order of the form elements in the submitted form.
     *
     * @return either a FilePart, a ParamPart or
     * null if there are no more parts to read.
     * @throws IOException if an input or output exception has occurred.
     * @see FilePart
     * @see ParamPart
     */
    public Part readNextPart() throws IOException {
        // Make sure the last file was entirely read from the input
        if (lastFilePart != null) {
            lastFilePart.getInputStream().close();
            lastFilePart = null;
        }

        // A missing line means no parts are left.  IE4 on Mac sends an empty
        // line at the end; treat that as the end too.
        String line = readLine();
        if (line == null || line.length() == 0) {
            return null;
        }

        // Read the headers; they look like this (not all may be present):
        // Content-Disposition: form-data; name="field1"; filename="file1.txt"
        // Content-Type: type/subtype
        // Content-Transfer-Encoding: binary
        // Header lines run until an empty line.  A line starting with
        // whitespace continues the previous header.
        Vector<String> headers = new Vector<String>();
        while (line != null && line.length() > 0) {
            String nextLine = readLine();
            while (nextLine != null
                    && (nextLine.startsWith(" ") || nextLine.startsWith("\t"))) {
                line = line + nextLine;
                nextLine = readLine();
            }
            headers.addElement(line);
            line = nextLine;
        }

        // The stream ended inside the headers: there is no usable part
        if (line == null) {
            return null;
        }

        String name = null;
        String filename = null;
        String origname = null;
        String contentType = "text/plain";  // rfc1867 says this is the default

        for (String header : headers) {
            String lower = toAsciiLowerCase(header);
            if (lower.startsWith(DISPOSITION_PREFIX)) {
                String[] dispInfo = extractDispositionInfo(header);
                // dispInfo[0] is the disposition itself, not currently used
                name = dispInfo[1];
                filename = dispInfo[2];
                origname = dispInfo[3];
            } else if (lower.startsWith("content-type:")) {
                contentType = extractContentType(header);
            }
        }

        // Now, finally, we read the content (end after reading the boundary)
        if (filename == null) {
            // This is a parameter; the encoding is needed to parse the value
            return new ParamPart(name, in, boundary, encoding);
        }

        // This is a file
        if (filename.length() == 0) {
            filename = null; // empty filename, probably an "empty" file param
        }
        lastFilePart = new FilePart(name, in, boundary, contentType, filename, origname);
        return lastFilePart;
    }

    /**
     * Extracts and returns the boundary token from a Content-Type value.
     * Handles quoted boundaries and boundaries that are followed by further
     * parameters (for example "; charset=UTF-8").
     *
     * @param line the Content-Type header value.
     * @return the boundary token prefixed with "--", or null if the value
     * carries no (or an empty) boundary parameter.
     */
    private static String extractBoundary(String line) {
        // Use lastIndexOf() because IE 4.01 on Win98 has been known to send the
        // "boundary=" string multiple times.
        int index = line.lastIndexOf("boundary=");
        if (index == -1) {
            return null;
        }
        String token = line.substring(index + 9).trim();  // 9 for "boundary="
        if (token.startsWith("\"")) {
            // Quoted: take everything up to the closing quote, or the rest of
            // the value if the quote is never closed.
            int close = token.indexOf('"', 1);
            token = (close == -1) ? token.substring(1) : token.substring(1, close);
        } else {
            // Unquoted: the token ends where the next parameter starts
            int semicolon = token.indexOf(';');
            if (semicolon != -1) {
                token = token.substring(0, semicolon).trim();
            }
        }
        if (token.length() == 0) {
            return null;
        }

        // The real boundary is always preceded by an extra "--"
        return "--" + token;
    }

    /**
     * Finds a parameter key (such as name=") at or after the given index,
     * skipping occurrences that are merely the tail of a longer key, so that
     * name= is not found inside filename=.
     *
     * @param line lowercased header line to search.
     * @param key  lowercased key to look for.
     * @param from index to start searching at.
     * @return index of the key, or -1 if it is not present.
     */
    private static int indexOfParameter(String line, String key, int from) {
        int index = line.indexOf(key, from);
        while (index > 0 && isKeyChar(line.charAt(index - 1))) {
            index = line.indexOf(key, index + 1);
        }
        return index;
    }

    /**
     * Tells whether a character can be part of a parameter key.
     */
    private static boolean isKeyChar(char c) {
        return Character.isLetterOrDigit(c) || c == '-' || c == '_';
    }

    /**
     * Extracts and returns disposition info from a line, as a String
     * array with elements: disposition, name, filename, original filename.
     *
     * @param line the complete Content-Disposition header line.
     * @return String[4] of: disposition, field name, filename with any path
     * removed (null if no filename was given), filename exactly as sent
     * (null if no filename was given).
     * @throws IOException if the line is malformatted.
     */
    private String[] extractDispositionInfo(String line) throws IOException {
        // Search in a lowercased copy but cut values out of the original line.
        // ASCII-only lowercasing keeps both strings index-compatible.
        String origline = line;
        String lower = toAsciiLowerCase(origline);

        // Get the content disposition, should be "form-data"
        int start = lower.indexOf(DISPOSITION_PREFIX);
        int semicolon = lower.indexOf(';');
        if (start == -1 || semicolon < start + DISPOSITION_PREFIX.length()) {
            throw new IOException("Content disposition corrupt: " + origline);
        }
        String disposition =
                lower.substring(start + DISPOSITION_PREFIX.length(), semicolon).trim();
        if (!disposition.equals("form-data")) {
            throw new IOException("Invalid content disposition: " + disposition);
        }

        // Get the field name, normally quoted
        int valueOffset = 6;  // length of name="
        int nameStart = indexOfParameter(lower, "name=\"", semicolon);
        int nameEnd = (nameStart == -1) ? -1 : lower.indexOf('"', nameStart + valueOffset);
        if (nameStart == -1 || nameEnd == -1) {
            // Some browsers like lynx don't surround the name with quotes
            valueOffset = 5;  // length of name=
            nameStart = indexOfParameter(lower, "name=", semicolon);
            if (nameStart == -1) {
                throw new IOException("Content disposition corrupt: " + origline);
            }
            nameEnd = lower.indexOf(';', nameStart + valueOffset);
            if (nameEnd == -1) {
                nameEnd = lower.length();
            }
        }
        String name = origline.substring(nameStart + valueOffset, nameEnd);

        // Get the filename, if given; it is looked for after the name
        String filename = null;
        String origname = null;
        int fileStart = indexOfParameter(lower, "filename=\"", nameEnd);
        int fileEnd = (fileStart == -1) ? -1 : lower.indexOf('"', fileStart + 10);
        if (fileStart != -1 && fileEnd != -1) {
            origname = origline.substring(fileStart + 10, fileEnd);  // skip filename="
            filename = origname;
            // The filename may contain a full path.  Cut to just the filename.
            int slash =
                    Math.max(filename.lastIndexOf('/'), filename.lastIndexOf('\\'));
            if (slash > -1) {
                filename = filename.substring(slash + 1);  // past last slash
            }
        }

        // An empty (non-null) filename denotes that no file was posted
        return new String[]{disposition, name, filename, origname};
    }

    /**
     * Read the next line of input, without its line terminator.
     *
     * @return a String containing the next line of input from the stream,
     * or null to indicate the end of the stream.
     * @throws IOException if an input or output exception has occurred.
     */
    private String readLine() throws IOException {
        // Lines longer than the buffer are collected as bytes and decoded in
        // one go, so a multi-byte character split across two reads survives.
        ByteArrayOutputStream overflow = null;
        int count;
        while (true) {
            count = in.readLine(buf, 0, buf.length);
            // Keep reading only if the buffer was filled before the newline
            boolean truncated = count == buf.length && buf[count - 1] != '\n';
            if (!truncated) {
                break;
            }
            if (overflow == null) {
                overflow = new ByteArrayOutputStream(buf.length * 2);
            }
            overflow.write(buf, 0, count);
        }

        String text;
        if (overflow == null) {
            if (count <= 0) {
                return null;  // nothing read, must be at the end of stream
            }
            text = new String(buf, 0, count, encoding);
        } else {
            if (count > 0) {
                overflow.write(buf, 0, count);
            }
            text = overflow.toString(encoding);
        }
        if (text.length() == 0) {
            return null;
        }

        // Cut off the trailing \n or \r\n
        // It should always be \r\n but IE5 sometimes does just \n
        int end = text.length();
        if (text.charAt(end - 1) == '\n') {
            end--;
            if (end > 0 && text.charAt(end - 1) == '\r') {
                end--;
            }
        }
        return text.substring(0, end);
    }
}

    

    

    
            
    
            

    
        
            
                Related Artifacts
                
                     mysql-connector-java mysql
 facebook-messenger com.github.codedrinker
 selenium-java org.seleniumhq.selenium
 instagram-java com.github.sola92
 gson com.google.code.gson
 poi org.apache.poi
 httpclient org.apache.httpcomponents
 json org.json
 facebook-java-api com.google.code.facebook-java-api
 poi-ooxml org.apache.poi
 jackson-databind com.fasterxml.jackson.core
 junit junit
 primefaces org.primefaces
 ojdbc7 com.github.noraui
 jfoenix com.jfoenix
 testng org.testng
 json-simple com.googlecode.json-simple
 selenium-server org.seleniumhq.selenium
 itextpdf com.itextpdf
 spring-core org.springframework
                
            
        
        
            
                Related Groups
                
                     org.springframework
 org.apache.poi
 org.hibernate
 org.springframework.boot
 com.fasterxml.jackson.core
 com.itextpdf
 org.seleniumhq.selenium
 mysql
 org.finos.legend.engine
 org.apache.httpcomponents
 org.apache.logging.log4j
 org.openjfx
 org.apache.commons
 org.json
 com.google.guava
 com.google.zxing
 net.sf.jasperreports
 javax.xml.bind
 ojdbc
 com.google.code.facebook-java-api