All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.camel.util.UnsafeUriCharactersEncoder Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.camel.util;

import java.util.BitSet;
import java.util.List;

/**
 * Encoder for unsafe URI characters.
 * 

* A good source for details is wikipedia url encode article. */ public final class UnsafeUriCharactersEncoder { private static final BitSet unsafeCharactersFastParser; private static final BitSet unsafeCharactersRfc1738; private static final BitSet unsafeCharactersHttp; private static final char[] HEX_DIGITS = { '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'A', 'B', 'C', 'D', 'E', 'F', 'a', 'b', 'c', 'd', 'e', 'f' }; static { unsafeCharactersFastParser = new BitSet(14); unsafeCharactersFastParser.set(' '); unsafeCharactersFastParser.set('"'); unsafeCharactersFastParser.set('<'); unsafeCharactersFastParser.set('>'); unsafeCharactersFastParser.set('%'); unsafeCharactersFastParser.set('{'); unsafeCharactersFastParser.set('}'); unsafeCharactersFastParser.set('|'); unsafeCharactersFastParser.set('\\'); unsafeCharactersFastParser.set('^'); unsafeCharactersFastParser.set('~'); unsafeCharactersFastParser.set('['); unsafeCharactersFastParser.set(']'); unsafeCharactersFastParser.set('`'); // we allow # as a safe when using the fast parser as its used for // looking up beans in the registry (foo=#myBar) } static { unsafeCharactersRfc1738 = new BitSet(15); unsafeCharactersRfc1738.set(' '); unsafeCharactersRfc1738.set('"'); unsafeCharactersRfc1738.set('<'); unsafeCharactersRfc1738.set('>'); unsafeCharactersRfc1738.set('#'); unsafeCharactersRfc1738.set('%'); unsafeCharactersRfc1738.set('{'); unsafeCharactersRfc1738.set('}'); unsafeCharactersRfc1738.set('|'); unsafeCharactersRfc1738.set('\\'); unsafeCharactersRfc1738.set('^'); unsafeCharactersRfc1738.set('~'); unsafeCharactersRfc1738.set('['); unsafeCharactersRfc1738.set(']'); unsafeCharactersRfc1738.set('`'); } static { unsafeCharactersHttp = new BitSet(13); unsafeCharactersHttp.set(' '); unsafeCharactersHttp.set('"'); unsafeCharactersHttp.set('<'); unsafeCharactersHttp.set('>'); unsafeCharactersHttp.set('#'); unsafeCharactersHttp.set('%'); unsafeCharactersHttp.set('{'); unsafeCharactersHttp.set('}'); unsafeCharactersHttp.set('|'); unsafeCharactersHttp.set('\\'); unsafeCharactersHttp.set('^'); unsafeCharactersHttp.set('~'); unsafeCharactersHttp.set('`'); } private UnsafeUriCharactersEncoder() { // util class } public static boolean isSafeFastParser(char ch) { return !unsafeCharactersFastParser.get(ch); } public static String encode(String s) { return encode(s, unsafeCharactersRfc1738); } public static String encodeHttpURI(String s) { return encode(s, unsafeCharactersHttp); } public static String encode(String s, BitSet unsafeCharacters) { return encode(s, unsafeCharacters, false); } public static String encode(String s, boolean checkRaw) { return encode(s, unsafeCharactersRfc1738, checkRaw); } public static String encodeHttpURI(String s, boolean checkRaw) { return encode(s, unsafeCharactersHttp, checkRaw); } // Just skip the encode for isRAW part public static String encode(String s, BitSet unsafeCharacters, boolean checkRaw) { if (s == null) { return null; } int len = s.length(); if (len == 0) { return s; } // first check whether we actually need to encode boolean safe = true; for (int i = 0; i < len; i++) { char ch = s.charAt(i); // just deal with the ascii character if (ch > 0 && ch < 128 && unsafeCharacters.get(ch)) { safe = false; break; } } if (safe) { return s; } List> rawPairs = null; if (checkRaw) { rawPairs = URISupport.scanRaw(s); } // add a bit of extra space as initial capacity int initial = len + 8; // okay there are some unsafe characters so we do need to encode // see details at: http://en.wikipedia.org/wiki/Url_encode StringBuilder sb = new StringBuilder(initial); for (int i = 0; i < len; i++) { char ch = s.charAt(i); if (ch > 0 && ch < 128 && unsafeCharacters.get(ch)) { // special for % sign as it may be a decimal encoded value if (ch == '%') { char next = i + 1 < len ? s.charAt(i + 1) : ' '; char next2 = i + 2 < len ? s.charAt(i + 2) : ' '; if (isHexDigit(next) && isHexDigit(next2) && !URISupport.isRaw(i, rawPairs)) { // its already encoded (decimal encoded) so just append as is sb.append(ch); } else { // must escape then, as its an unsafe character appendEscape(sb, (byte) ch); } } else { // must escape then, as its an unsafe character appendEscape(sb, (byte) ch); } } else { sb.append(ch); } } return sb.toString(); } private static void appendEscape(StringBuilder sb, byte b) { sb.append('%'); sb.append(HEX_DIGITS[(b >> 4) & 0x0f]); sb.append(HEX_DIGITS[(b) & 0x0f]); } private static boolean isHexDigit(char ch) { // 0..9 A..F a..f return ch >= 48 && ch <= 57 || ch >= 65 && ch <= 70 || ch >= 97 && ch <= 102; } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy