All Downloads are FREE. Search and download functionalities are using the official Maven repository.

src.main.java.com.mebigfatguy.fbcontrib.detect.CharsetIssues Maven / Gradle / Ivy

/*
 * fb-contrib - Auxiliary detectors for Java programs
 * Copyright (C) 2005-2019 Dave Brosius
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */
package com.mebigfatguy.fbcontrib.detect;

import java.nio.charset.Charset;
import java.util.Collections;
import java.util.HashMap;
import java.util.List;
import java.util.Locale;
import java.util.Map;
import java.util.Set;

import org.apache.bcel.Constants;
import org.apache.bcel.classfile.Method;

import com.mebigfatguy.fbcontrib.utils.BugType;
import com.mebigfatguy.fbcontrib.utils.FQMethod;
import com.mebigfatguy.fbcontrib.utils.PublicAPI;
import com.mebigfatguy.fbcontrib.utils.SignatureBuilder;
import com.mebigfatguy.fbcontrib.utils.SignatureUtils;
import com.mebigfatguy.fbcontrib.utils.UnmodifiableSet;
import com.mebigfatguy.fbcontrib.utils.Values;

import edu.umd.cs.findbugs.BugInstance;
import edu.umd.cs.findbugs.BugReporter;
import edu.umd.cs.findbugs.BytecodeScanningDetector;
import edu.umd.cs.findbugs.OpcodeStack;
import edu.umd.cs.findbugs.ba.ClassContext;

/**
 * looks for issues related to manually specified charsets by using string literals.
 *
 * <p>
 * Three kinds of problems are reported:
 * </p>
 * <ul>
 * <li>a standard charset name is passed as a String to a method that has an overload accepting a {@link Charset}</li>
 * <li>a standard charset name is passed as a String literal to a method that only accepts a String</li>
 * <li>a String literal is passed as a charset name, but {@link Charset#forName(String)} rejects it in the analyzing jvm</li>
 * </ul>
 */
public class CharsetIssues extends BytecodeScanningDetector {

    private static final String CHARSET_SIG = SignatureUtils.classToSignature("java/nio/charset/Charset");

    /** methods taking a charset name as a String, that have an equivalent overload taking a Charset, mapped to the stack offset of the String */
    private static final Map<FQMethod, Integer> REPLACEABLE_ENCODING_METHODS;
    /** methods taking a charset name as a String, that have no overload taking a Charset, mapped to the stack offset of the String */
    private static final Map<FQMethod, Integer> UNREPLACEABLE_ENCODING_METHODS;
    /** the upper case names of the encodings checked for; literals are upper cased before being looked up in this set */
    public static final Set<String> STANDARD_JDK7_ENCODINGS = UnmodifiableSet.create("US-ASCII", "ISO-8859-1", "UTF-8", "UTF-16BE", "UTF-16LE", "UTF-16");

    /*
     * The stack offset refers to the relative position of the Ljava/lang/String; of interest (i.e. the one that is the charset). For example, a stack offset
     * of 0 means the String charset was the last param, and a stack offset of 2 means it was the 3rd to last.
     *
     * Not coincidentally, the argument that needs to be replaced is the [(# of arguments) - offset]th one
     */
    static {
        Map<FQMethod, Integer> replaceable = new HashMap<>(8);
        replaceable.put(new FQMethod("java/io/InputStreamReader", Values.CONSTRUCTOR,
                new SignatureBuilder().withParamTypes("java/io/InputStream", Values.SLASHED_JAVA_LANG_STRING).toString()), Values.ZERO);
        replaceable.put(new FQMethod("java/io/OutputStreamWriter", Values.CONSTRUCTOR,
                new SignatureBuilder().withParamTypes("java/io/OutputStream", Values.SLASHED_JAVA_LANG_STRING).toString()), Values.ZERO);
        replaceable.put(new FQMethod(Values.SLASHED_JAVA_LANG_STRING, Values.CONSTRUCTOR,
                new SignatureBuilder().withParamTypes(SignatureBuilder.SIG_BYTE_ARRAY, Values.SLASHED_JAVA_LANG_STRING).toString()), Values.ZERO);
        replaceable.put(new FQMethod(Values.SLASHED_JAVA_LANG_STRING, Values.CONSTRUCTOR,
                new SignatureBuilder()
                        .withParamTypes(SignatureBuilder.SIG_BYTE_ARRAY, Values.SIG_PRIMITIVE_INT, Values.SIG_PRIMITIVE_INT, Values.SLASHED_JAVA_LANG_STRING)
                        .toString()),
                Values.ZERO);
        replaceable.put(
                new FQMethod(Values.SLASHED_JAVA_LANG_STRING, "getBytes",
                        new SignatureBuilder().withParamTypes(Values.SLASHED_JAVA_LANG_STRING).withReturnType(SignatureBuilder.SIG_BYTE_ARRAY).toString()),
                Values.ZERO);
        replaceable.put(new FQMethod("java/util/Formatter", Values.CONSTRUCTOR,
                new SignatureBuilder().withParamTypes("java/io/File", Values.SLASHED_JAVA_LANG_STRING, "java/util/Locale").toString()), Values.ONE);

        REPLACEABLE_ENCODING_METHODS = Collections.unmodifiableMap(replaceable);

        String twoStringsToString = new SignatureBuilder().withParamTypes(Values.SLASHED_JAVA_LANG_STRING, Values.SLASHED_JAVA_LANG_STRING)
                .withReturnType(Values.SLASHED_JAVA_LANG_STRING).toString();
        String stringToString = new SignatureBuilder().withParamTypes(Values.SLASHED_JAVA_LANG_STRING).withReturnType(Values.SLASHED_JAVA_LANG_STRING)
                .toString();
        String fileAndStringToVoid = new SignatureBuilder().withParamTypes("java/io/File", Values.SLASHED_JAVA_LANG_STRING).toString();
        String stringToCharset = new SignatureBuilder().withParamTypes(Values.SLASHED_JAVA_LANG_STRING).withReturnType("java/nio/charset/Charset").toString();
        Map<FQMethod, Integer> unreplaceable = new HashMap<>(32);
        unreplaceable.put(new FQMethod("java/net/URLEncoder", "encode", twoStringsToString), Values.ZERO);
        unreplaceable.put(new FQMethod("java/net/URLDecoder", "decode", twoStringsToString), Values.ZERO);
        // ByteArrayOutputStream.toString(String) returns a String, a void returning signature would never match a call site
        unreplaceable.put(new FQMethod("java/io/ByteArrayOutputStream", Values.TOSTRING, stringToString), Values.ZERO);
        unreplaceable.put(new FQMethod("java/io/PrintStream", Values.CONSTRUCTOR, SignatureBuilder.SIG_TWO_STRINGS_TO_VOID), Values.ZERO);
        unreplaceable.put(new FQMethod("java/io/PrintStream", Values.CONSTRUCTOR, fileAndStringToVoid), Values.ZERO);
        // the middle parameter is the boolean autoFlush flag: PrintStream(OutputStream, boolean, String)
        unreplaceable.put(
                new FQMethod("java/io/PrintStream", Values.CONSTRUCTOR,
                        new SignatureBuilder().withParamTypes("java/io/OutputStream", Values.SIG_PRIMITIVE_BOOLEAN, Values.SLASHED_JAVA_LANG_STRING).toString()),
                Values.ZERO);
        unreplaceable.put(new FQMethod("java/io/PrintStream", "toCharset", stringToCharset), Values.ZERO);
        unreplaceable.put(new FQMethod("java/io/PrintWriter", Values.CONSTRUCTOR, SignatureBuilder.SIG_TWO_STRINGS_TO_VOID), Values.ZERO);
        unreplaceable.put(new FQMethod("java/io/PrintWriter", Values.CONSTRUCTOR, fileAndStringToVoid), Values.ZERO);
        unreplaceable.put(new FQMethod("java/io/PrintWriter", "toCharset", stringToCharset), Values.ZERO);
        unreplaceable.put(new FQMethod("java/lang/StringCoding", "decode",
                new SignatureBuilder()
                        .withParamTypes(Values.SLASHED_JAVA_LANG_STRING, SignatureBuilder.SIG_BYTE_ARRAY, Values.SIG_PRIMITIVE_INT, Values.SIG_PRIMITIVE_INT)
                        .withReturnType(SignatureBuilder.SIG_CHAR_ARRAY).toString()),
                Values.THREE);
        unreplaceable.put(new FQMethod("java/lang/StringCoding", "encode",
                new SignatureBuilder()
                        .withParamTypes(Values.SLASHED_JAVA_LANG_STRING, SignatureBuilder.SIG_CHAR_ARRAY, Values.SIG_PRIMITIVE_INT, Values.SIG_PRIMITIVE_INT)
                        .withReturnType(SignatureBuilder.SIG_BYTE_ARRAY).toString()),
                Values.THREE);
        unreplaceable.put(new FQMethod("java/util/Formatter", Values.CONSTRUCTOR, fileAndStringToVoid), Values.ZERO);
        unreplaceable.put(
                new FQMethod("java/util/Formatter", Values.CONSTRUCTOR,
                        new SignatureBuilder().withParamTypes("java/io/OutputStream", Values.SLASHED_JAVA_LANG_STRING, "java/util/Locale").toString()),
                Values.ONE);
        unreplaceable.put(new FQMethod("java/util/Formatter", Values.CONSTRUCTOR,
                new SignatureBuilder().withParamTypes("java/io/OutputStream", Values.SLASHED_JAVA_LANG_STRING).toString()), Values.ZERO);
        unreplaceable.put(
                new FQMethod("java/util/Formatter", Values.CONSTRUCTOR,
                        new SignatureBuilder().withParamTypes(Values.SLASHED_JAVA_LANG_STRING, Values.SLASHED_JAVA_LANG_STRING, "java/util/Locale").toString()),
                Values.ONE);
        unreplaceable.put(new FQMethod("java/util/Formatter", Values.CONSTRUCTOR, SignatureBuilder.SIG_TWO_STRINGS_TO_VOID), Values.ZERO);
        // same shape as the PrintStream/PrintWriter toCharset helpers registered above
        unreplaceable.put(new FQMethod("java/util/Formatter", "toCharset", stringToCharset), Values.ZERO);
        unreplaceable.put(new FQMethod("java/util/logging/Handler", "setEncoding", SignatureBuilder.SIG_STRING_TO_VOID), Values.ZERO);
        unreplaceable.put(new FQMethod("java/util/logging/MemoryHandler", "setEncoding", SignatureBuilder.SIG_STRING_TO_VOID), Values.ZERO);
        unreplaceable.put(new FQMethod("java/util/logging/StreamHandler", "setEncoding", SignatureBuilder.SIG_STRING_TO_VOID), Values.ZERO);
        unreplaceable.put(new FQMethod("java/util/Scanner", Values.CONSTRUCTOR, fileAndStringToVoid), Values.ZERO);
        unreplaceable.put(new FQMethod("java/util/Scanner", Values.CONSTRUCTOR,
                new SignatureBuilder().withParamTypes("java/io/InputStream", Values.SLASHED_JAVA_LANG_STRING).toString()), Values.ZERO);
        unreplaceable.put(new FQMethod("java/util/Scanner", Values.CONSTRUCTOR,
                new SignatureBuilder().withParamTypes("java/nio/file/Path", Values.SLASHED_JAVA_LANG_STRING).toString()), Values.ZERO);
        unreplaceable.put(
                new FQMethod("java/util/Scanner", Values.CONSTRUCTOR,
                        new SignatureBuilder().withParamTypes("java/nio/channels/ReadableByteChannel", Values.SLASHED_JAVA_LANG_STRING).toString()),
                Values.ZERO);
        unreplaceable.put(new FQMethod("javax/servlet/ServletResponse", "setCharacterEncoding", SignatureBuilder.SIG_STRING_TO_VOID), Values.ZERO);
        unreplaceable.put(new FQMethod("java/beans/XMLEncoder", Values.CONSTRUCTOR, new SignatureBuilder()
                .withParamTypes("java/io/OutputStream", Values.SLASHED_JAVA_LANG_STRING, Values.SIG_PRIMITIVE_BOOLEAN, Values.SIG_PRIMITIVE_INT).toString()),
                Values.TWO);
        unreplaceable.put(
                new FQMethod("java/nio/channels/Channels", "newReader", new SignatureBuilder()
                        .withParamTypes("java/nio/channels/ReadableByteChannel", Values.SLASHED_JAVA_LANG_STRING).withReturnType("java/io/Reader").toString()),
                Values.ZERO);
        unreplaceable.put(
                new FQMethod("java/nio/channels/Channels", "newWriter", new SignatureBuilder()
                        .withParamTypes("java/nio/channels/WritableByteChannel", Values.SLASHED_JAVA_LANG_STRING).withReturnType("java/io/Writer").toString()),
                Values.ZERO);

        UNREPLACEABLE_ENCODING_METHODS = Collections.unmodifiableMap(unreplaceable);
    }

    private final BugReporter bugReporter;
    private OpcodeStack stack;
    private int classVersion;

    /**
     * constructs a CSI detector given the reporter to report bugs on
     *
     * @param bugReporter
     *            the sink of bug reports
     */
    public CharsetIssues(BugReporter bugReporter) {
        this.bugReporter = bugReporter;
    }

    /**
     * implements the visitor to make sure the class is at least 1.4, and if so continues, resetting the opcode stack
     *
     * @param classContext
     *            the currently parsed java class
     */
    @Override
    public void visitClassContext(ClassContext classContext) {
        try {
            classVersion = classContext.getJavaClass().getMajor();
            if (classVersion >= Constants.MAJOR_1_4) {
                stack = new OpcodeStack();
                super.visitClassContext(classContext);
            }
        } finally {
            // don't hold on to the stack between classes
            stack = null;
        }
    }

    /**
     * implements the visitor to reset the opcode stack for a new method
     *
     * @param obj
     *            the currently parsed method
     */
    @Override
    public void visitMethod(Method obj) {
        stack.resetForMethodEntry(this);
    }

    /**
     * implements the visitor to look for method calls that take a parameter that either represents a encoding via a string, or takes a Charset. If the method
     * can take both, and a string is presented for a standard charset available in jdk 7, and the code is compiled against 7, then report. It also looks for
     * mistakes, encodings that aren't recognized in the current jvm.
     *
     * @param seen
     *            the currently parsed opcode
     */
    @Override
    public void sawOpcode(int seen) {
        try {
            stack.precomputation(this);

            switch (seen) {
                case INVOKESPECIAL:
                case INVOKESTATIC:
                case INVOKEINTERFACE:
                case INVOKEVIRTUAL:
                    checkInvocation(seen);
                break;
                default:
                break;
            }
        } finally {
            // the stack must be advanced for every opcode, whether or not anything was reported
            stack.sawOpcode(this, seen);
        }
    }

    /**
     * inspects the method call at the current opcode, and reports a bug if a constant charset name is passed to one of the known encoding methods, and that
     * name is either a standard charset, or is not recognized by the current jvm
     *
     * @param seen
     *            the invoke opcode currently being parsed
     */
    private void checkInvocation(int seen) {
        String className = getClassConstantOperand();
        String methodName = getNameConstantOperand();
        String methodSig = getSigConstantOperand();
        FQMethod methodInfo = new FQMethod(className, methodName, methodSig);

        Integer stackOffset = REPLACEABLE_ENCODING_METHODS.get(methodInfo);
        boolean replaceable = stackOffset != null;
        if (!replaceable) {
            stackOffset = UNREPLACEABLE_ENCODING_METHODS.get(methodInfo);
            if (stackOffset == null) {
                return;
            }
        }

        int offset = stackOffset.intValue();
        String encoding = getEncodingConstant(offset);
        if (encoding == null) {
            return;
        }

        encoding = encoding.toUpperCase(Locale.ENGLISH);
        if ((classVersion >= Constants.MAJOR_1_7) && STANDARD_JDK7_ENCODINGS.contains(encoding)) {
            if (replaceable) {
                // also report the signature of the overload that takes a Charset in place of the String
                String changedMethodSig = replaceNthArgWithCharsetString(methodSig, offset);
                bugReporter.reportBug(new BugInstance(this, BugType.CSI_CHAR_SET_ISSUES_USE_STANDARD_CHARSET.name(), NORMAL_PRIORITY).addClass(this)
                        .addMethod(this).addSourceLine(this).addCalledMethod(this)
                        .addCalledMethod(className, methodName, changedMethodSig, seen == INVOKESTATIC));
            } else {
                bugReporter.reportBug(new BugInstance(this, BugType.CSI_CHAR_SET_ISSUES_USE_STANDARD_CHARSET_NAME.name(), NORMAL_PRIORITY).addClass(this)
                        .addMethod(this).addSourceLine(this).addCalledMethod(this));
            }
        }

        try {
            Charset.forName(encoding);
        } catch (IllegalArgumentException e) {
            // encompasses both IllegalCharsetNameException and UnsupportedCharsetException
            bugReporter.reportBug(new BugInstance(this, BugType.CSI_CHAR_SET_ISSUES_UNKNOWN_ENCODING.name(), NORMAL_PRIORITY).addClass(this).addMethod(this)
                    .addSourceLine(this).addCalledMethod(this).addString(encoding));
        }
    }

    /**
     * retrieves the constant String found on the opcode stack at the given offset, if there is one
     *
     * @param offset
     *            the offset from the top of the stack of the charset name argument
     *
     * @return the constant String at that offset, or null if the stack is too shallow, or the item is not a constant String
     */
    private String getEncodingConstant(int offset) {
        if (stack.getStackDepth() <= offset) {
            return null;
        }

        Object constant = stack.getStackItem(offset).getConstant();
        return (constant instanceof String) ? (String) constant : null;
    }

    /**
     * rebuilds a signature replacing a String argument at a specified spot, with a Charset parameter.
     *
     * @param sig
     *            the signature to replace
     * @param stackOffset
     *            the offset of the parameter to replace, counted from the last parameter
     *
     * @return a new signature with a Charset parameter
     */
    private static String replaceNthArgWithCharsetString(String sig, int stackOffset) {

        List<String> arguments = SignatureUtils.getParameterSignatures(sig);

        StringBuilder sb = new StringBuilder("(");
        // stack offsets count back from the last argument, list indices count forward from the first
        int argumentIndexToReplace = (arguments.size() - stackOffset) - 1;

        for (int i = 0; i < arguments.size(); i++) {
            if (i == argumentIndexToReplace) {
                sb.append(CHARSET_SIG);
            } else {
                sb.append(arguments.get(i));
            }
        }

        // keep the closing paren and the return type as is
        sb.append(sig.substring(sig.lastIndexOf(')')));
        return sb.toString();
    }

    /**
     * used by external tools, lists the method signature checked for, for unreplaceable encoding methods
     *
     * @return a new, modifiable map of these methods, keyed by the string form of the method, to the stack offset of the charset name argument
     */
    @PublicAPI("Used by fb-contrib-eclipse-quickfixes to determine type of fix to apply")
    public static Map<String, Integer> getUnreplaceableCharsetEncodings() {
        return toStringKeyedMap(UNREPLACEABLE_ENCODING_METHODS);
    }

    /**
     * used by external tools, lists the method signature checked for, for replaceable encoding methods
     *
     * @return a new, modifiable map of these methods, keyed by the string form of the method, to the stack offset of the charset name argument
     */
    @PublicAPI("Used by fb-contrib-eclipse-quickfixes to determine type of fix to apply")
    public static Map<String, Integer> getReplaceableCharsetEncodings() {
        return toStringKeyedMap(REPLACEABLE_ENCODING_METHODS);
    }

    /**
     * copies a map of encoding methods into a new map that is keyed by the string form of each method
     *
     * @param methods
     *            the encoding methods and their stack offsets
     *
     * @return a new map holding the same offsets, keyed by the toString of each method
     */
    private static Map<String, Integer> toStringKeyedMap(Map<FQMethod, Integer> methods) {
        Map<String, Integer> encodings = new HashMap<>(methods.size());
        for (Map.Entry<FQMethod, Integer> entry : methods.entrySet()) {
            encodings.put(entry.getKey().toString(), entry.getValue());
        }
        return encodings;
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy