src.java.com.ctc.wstx.io.SingleByteTextWriter Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of wstx-lgpl
There is a newer version: 3.2.7
package com.ctc.wstx.io;

import java.io.*;

/**
 * Escaping writer that will properly escape normal textual content
 * that needs to be escaped, when outputting using a Writer that
 * produces a subset of Unicode values.
 * When the underlying Writer only allows direct output of a subset of
 * Unicode values, it is generally the case that only the lowest
 * Unicode characters (7-bit ones for ASCII, 8-bit ones for ISO-Latin-1,
 * something similar for other ISO-8859 encodings) can be output
 * as is, and the rest need to be output as character entities.
 */
public class SingleByteTextWriter
    extends WriterBase
{
    /**
     * First Unicode character (one with lowest value) after (and including)
     * which character entities have to be used.
     */
    private final char mHighChar;

    /**
     * Set when the most recently written character was ']'. A '>' that
     * immediately follows is then written as "&amp;gt;" so that the output
     * cannot contain a literal "]]&gt;" sequence inside text content.
     */
    private boolean mJustWroteBracket = false;

    /**
     * @param out Underlying Writer to use for actual writes
     * @param enc Encoding that the Writer is using (not used by this
     *   class itself)
     * @param charsetSize Number of Unicode characters (starting
     *   with the null one) that need not be escaped (for example,
     *   128 for US-ASCII, 256 for ISO-Latin etc)
     */
    public SingleByteTextWriter(Writer out, String enc,
                                int charsetSize)
    {
        super(out);
        mHighChar = (char) charsetSize;
    }


    /**
     * Writes a single character of text content, escaping it if needed:
     * '&lt;' and '&amp;' are always written as predefined entities, '&gt;'
     * is written as an entity only when it directly follows a ']', and
     * any character at or above {@link #mHighChar} is passed to
     * <code>writeAsEntity</code>.
     *<p>
     * NOTE(review): unlike the <code>char[]</code> variant, this method
     * does not reject CHAR_NULL; confirm whether that is intentional.
     *
     * @param c Character to write
     *
     * @throws IOException if the underlying writer fails
     */
    public void write(int c) throws IOException
    {
        if (c <= HIGHEST_ENCODABLE_TEXT_CHAR) {
            if (c == '<') {
                out.write("&lt;");
            } else if (c == '&') {
                out.write("&amp;");
            } else if (c == '>' && mJustWroteBracket) {
                out.write("&gt;");
            } else {
                out.write(c);
            }
            mJustWroteBracket = false;
        } else if (c >= mHighChar) {
            writeAsEntity(c);
            /* What was output last is an entity, not a bracket; clear
             * the flag so state matches what the bulk write methods
             * would have ended up with for the same input.
             */
            mJustWroteBracket = false;
        } else {
            // presumably ']' always ends up here, i.e. it is above
            // HIGHEST_ENCODABLE_TEXT_CHAR -- verify against WriterBase
            out.write(c);
            mJustWroteBracket = (c == ']');
        }
    }

    /**
     * Writes a section of a character array as text content. Runs of
     * characters that need no escaping are passed to the underlying
     * writer in one call; '&lt;', '&amp;', '&gt;' directly after ']', and
     * characters at or above {@link #mHighChar} are written in escaped
     * form between those runs. A CHAR_NULL in the input results in a
     * call to <code>throwNullChar</code>.
     *
     * @param cbuf Buffer that contains the characters to write
     * @param offset Index of the first character to write
     * @param len Number of characters to write; nothing is written if
     *   less than one
     *
     * @throws IOException if the underlying writer fails
     */
    public void write(char cbuf[], int offset, int len) throws IOException
    {
        // Let's simplify code a bit and offload the trivial case...
        if (len < 2) {
            if (len == 1) {
                write(cbuf[offset]);
            }
            return;
        }

        len += offset; // to get the index past last char to output
        // Need special handling for leftover ']' to cause quoting of '>'
        if (mJustWroteBracket) {
            if (cbuf[offset] == '>') {
                out.write("&gt;");
                ++offset;
            }
        }

        char c = CHAR_NULL;
        do {
            // Start of the current run of characters that can go out as is
            int start = offset;
            String ent = null;

            for (; offset < len; ++offset) {
                c = cbuf[offset];
                if (c <= HIGHEST_ENCODABLE_TEXT_CHAR) {
                    if (c == '<') {
                        ent = "&lt;";
                        break;
                    } else if (c == '&') {
                        ent = "&amp;";
                        break;
                    } else if (c == '>' && (offset > start)
                               && cbuf[offset-1] == ']') {
                        /* Only look back within the current run: chars
                         * before 'start' were either escaped or are not
                         * part of this write.
                         */
                        ent = "&gt;";
                        break;
                    } else if (c == CHAR_NULL) {
                        throwNullChar();
                    }
                    // should we escape \r?
                } else if (c >= mHighChar) {
                    break;
                }
                // otherwise ok
            }
            int outLen = offset - start;

            if (outLen > 0) {
                out.write(cbuf, start, outLen);
            }
            if (ent != null) {
                out.write(ent);
            } else if (offset < len) {
                // Stopped before the end without an entity: char is
                // outside of the directly encodable range
                writeAsEntity(c);
            }
            // The increment skips the character that was just escaped
        } while (++offset < len);

        // Ok, did we end up with a bracket?
        mJustWroteBracket = (c == ']');
    }

    /**
     * Writes a section of a String as text content, using the same
     * escaping rules as the <code>char[]</code> variant.
     *<p>
     * NOTE(review): unlike the <code>char[]</code> variant, this method
     * does not reject CHAR_NULL; confirm whether that is intentional.
     *
     * @param str String that contains the characters to write
     * @param offset Index of the first character to write
     * @param len Number of characters to write; nothing is written if
     *   less than one
     *
     * @throws IOException if the underlying writer fails
     */
    public void write(String str, int offset, int len) throws IOException
    {
        if (len < 2) { // let's do a simple check here
            if (len == 1) {
                write(str.charAt(offset));
            }
            return;
        }

        len += offset; // to get the index past last char to output
        // Ok, leftover ']' to cause quoting of '>'?
        if (mJustWroteBracket) {
            if (str.charAt(offset) == '>') {
                out.write("&gt;");
                ++offset;
            }
        }

        char c = CHAR_NULL;
        do {
            // Start of the current run of characters that can go out as is
            int start = offset;
            String ent = null;

            for (; offset < len; ++offset) {
                c = str.charAt(offset);
                if (c <= HIGHEST_ENCODABLE_TEXT_CHAR) {
                    if (c == '<') {
                        ent = "&lt;";
                        break;
                    } else if (c == '&') {
                        ent = "&amp;";
                        break;
                    } else if (c == '>' && (offset > start)
                               && str.charAt(offset-1) == ']') {
                        // Only look back within the current run
                        ent = "&gt;";
                        break;
                    }
                    // should we escape \r?
                } else if (c >= mHighChar) {
                    break;
                }
                // otherwise ok
            }
            int outLen = offset - start;
            if (outLen > 0) {
                out.write(str, start, outLen);
            }
            if (ent != null) {
                out.write(ent);
            } else if (offset < len) {
                // Stopped before the end without an entity: char is
                // outside of the directly encodable range
                writeAsEntity(c);
            }
            // The increment skips the character that was just escaped
        } while (++offset < len);

        // Ok, did we end up with a bracket?
        mJustWroteBracket = (c == ']');
    }
}