All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.drill.common.util.DrillStringUtils Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.drill.common.util;

import io.netty.buffer.ByteBuf;

import org.apache.commons.text.StringEscapeUtils;
import org.apache.commons.lang3.StringUtils;

import java.util.Arrays;
import java.util.stream.Collectors;

public class DrillStringUtils {

  /**
   * Converts the long number into more human readable string.
   */
  public static String readable(long bytes) {
    int unit = 1024;
    long absBytes = Math.abs(bytes);
    if (absBytes < unit) {
      return bytes + " B";
    }
    int exp = (int) (Math.log(absBytes) / Math.log(unit));
    char pre = ("KMGTPE").charAt(exp-1);
    return String.format("%s%.1f %ciB", (bytes == absBytes ? "" : "-"), absBytes / Math.pow(unit, exp), pre);
  }


  /**
   * Unescapes any Java literals found in the {@code String}.
   * For example, it will turn a sequence of {@code '\'} and
   * {@code 'n'} into a newline character, unless the {@code '\'}
   * is preceded by another {@code '\'}.
   *
   * @param input  the {@code String} to unescape, may be null
   * @return a new unescaped {@code String}, {@code null} if null string input
   */
  public static String unescapeJava(String input) {
    return StringEscapeUtils.unescapeJava(input);
  }

  /**
   * Escapes the characters in a {@code String} according to Java string literal
   * rules.
   *
   * Deals correctly with quotes and control-chars (tab, backslash, cr, ff,
   * etc.) so, for example, a tab becomes the characters {@code '\\'} and
   * {@code 't'}.
   *
   * Example:
   * 
   * input string: He didn't say, "Stop!"
   * output string: He didn't say, \"Stop!\"
   * 
* * @param input String to escape values in, may be null * @return String with escaped values, {@code null} if null string input */ public static String escapeJava(String input) { return StringEscapeUtils.escapeJava(input); } public static String escapeNewLines(String input) { if (input == null) { return null; } StringBuilder result = new StringBuilder(); boolean sawNewline = false; for (int i = 0; i < input.length(); i++) { char curChar = input.charAt(i); if (curChar == '\r' || curChar == '\n') { if (sawNewline) { continue; } sawNewline = true; result.append("\\n"); } else { sawNewline = false; result.append(curChar); } } return result.toString(); } /** * Copied form commons-lang 2.x code as common-lang 3.x has this API removed. * (http://commons.apache.org/proper/commons-lang/article3_0.html#StringEscapeUtils.escapeSql) * @param str * @return */ public static String escapeSql(String str) { return (str == null) ? null : StringUtils.replace(str, "'", "''"); } /** * Return a printable representation of a byte buffer, escaping the non-printable * bytes as '\\xNN' where NN is the hexadecimal representation of such bytes. * * This function does not modify the {@code readerIndex} and {@code writerIndex} * of the byte buffer. */ public static String toBinaryString(ByteBuf buf, int strStart, int strEnd) { StringBuilder result = new StringBuilder(); for (int i = strStart; i < strEnd; ++i) { appendByte(result, buf.getByte(i)); } return result.toString(); } /** * Return a printable representation of a byte array, escaping the non-printable * bytes as '\\xNN' where NN is the hexadecimal representation of such bytes. */ public static String toBinaryString(byte[] buf) { return toBinaryString(buf, 0, buf.length); } /** * Return a printable representation of a byte array, escaping the non-printable * bytes as '\\xNN' where NN is the hexadecimal representation of such bytes. */ public static String toBinaryString(byte[] buf, int strStart, int strEnd) { StringBuilder result = new StringBuilder(); for (int i = strStart; i < strEnd; ++i) { appendByte(result, buf[i]); } return result.toString(); } private static void appendByte(StringBuilder result, byte b) { int ch = b & 0xFF; if ( (ch >= '0' && ch <= '9') || (ch >= 'A' && ch <= 'Z') || (ch >= 'a' && ch <= 'z') || " `~!@#$%^&*()-_=+[]{}|;:'\",.<>/?".indexOf(ch) >= 0 ) { result.append((char)ch); } else { result.append(String.format("\\x%02X", ch)); } } /** * parsing a hex encoded binary string and write to an output buffer. * * This function does not modify the {@code readerIndex} and {@code writerIndex} * of the byte buffer. * * @return Index in the byte buffer just after the last written byte. */ public static int parseBinaryString(ByteBuf str, int strStart, int strEnd, ByteBuf out) { int dstEnd = 0; for (int i = strStart; i < strEnd; i++) { byte b = str.getByte(i); if (b == '\\' && strEnd > i+3 && (str.getByte(i+1) == 'x' || str.getByte(i+1) == 'X')) { // ok, take next 2 hex digits. byte hd1 = str.getByte(i+2); byte hd2 = str.getByte(i+3); if (isHexDigit(hd1) && isHexDigit(hd2)) { // [a-fA-F0-9] // turn hex ASCII digit -> number b = (byte) ((toBinaryFromHex(hd1) << 4) + toBinaryFromHex(hd2)); i += 3; // skip 3 } } out.setByte(dstEnd++, b); } return dstEnd; } /** * Takes a ASCII digit in the range A-F0-9 and returns * the corresponding integer/ordinal value. * @param ch The hex digit. * @return The converted hex value as a byte. */ private static byte toBinaryFromHex(byte ch) { if ( ch >= 'A' && ch <= 'F' ) { return (byte) ((byte)10 + (byte) (ch - 'A')); } else if ( ch >= 'a' && ch <= 'f' ) { return (byte) ((byte)10 + (byte) (ch - 'a')); } return (byte) (ch - '0'); } private static boolean isHexDigit(byte c) { return (c >= 'a' && c <= 'f') || (c >= 'A' && c <= 'F') || (c >= '0' && c <= '9'); } /** * Removes extra spaces and empty values in a CSV String * @param csv The CSV string to be sanitized * @return The sanitized CSV string */ public static String sanitizeCSV(String csv) { String[] tokens = csv.split(","); return Arrays.stream(tokens) .map(String::trim) .filter(StringUtils::isNotEmpty) .collect(Collectors.joining(",")); } /** * Removes all leading slash characters from specified string. * * @param path string to remove all leading slash characters * @return string with removed leading slash characters */ public static String removeLeadingSlash(String path) { return StringUtils.stripStart(path, "/"); } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy