ai.platon.pulsar.common.Strings Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of pulsar-common Show documentation
There is a newer version: 2.1.0
/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 * 
 * http://www.apache.org/licenses/LICENSE-2.0
 * 

 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package ai.platon.pulsar.common;

import org.apache.commons.lang3.StringUtils;
import org.apache.commons.lang3.Validate;
import org.apache.commons.lang3.math.NumberUtils;

import java.awt.event.KeyEvent;
import java.nio.ByteBuffer;
import java.util.*;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import static java.util.regex.Pattern.CASE_INSENSITIVE;

public final class Strings {

  final public static String[] emptyStringArray = {};

  final public static char COMMA = ',';

  final public static String COMMA_STR = ",";

  final public static char FULL_WIDTH_COMMA = '，';

  final public static String FULL_WIDTH_COMMA_STR = "，";

  final public static char ESCAPE_CHAR = '\\';

  // public static final Pattern HTML_CHARSET_PATTERN = Pattern.compile("^]*?content\\s*=[\\s\"']*)?([^>]*?)[\\s\"';]*charset\\s*=[\\s\"']([a-zA-Z0-9]{3,8})([^\\s\"'(/>)]*)", CASE_INSENSITIVE);

  public static final Pattern HTML_CHARSET_PATTERN = Pattern.compile("^]*", CASE_INSENSITIVE);

  public static final Pattern PRICE_PATTERN = Pattern.compile("[1-9](,{0,1}\\d+){0,8}(\\.\\d{1,2})|[1-9](,{0,1}\\d+){0,8}");

  // all special chars on a standard keyboard

  public static final String DEFAULT_KEEP_CHARS = "~!@#$%^&*()_+`-={}|[]\\:\";'<>?,./' \n\r\t";

  public static final String HTML_TAG_REGEX = "<(\"[^\"]*\"|'[^']*'|[^'\">])*>";

  public static final String FLOAT_REGEX = "^([+-]?(\\d+\\.)?\\d+)$";

  public static Pattern FLOAT_PATTERN = Pattern.compile(FLOAT_REGEX);

  public static Pattern HTML_TAG_PATTERN = Pattern.compile(HTML_TAG_REGEX);

  public static final String NUMERIC_LIKE_REGEX = "^.{0,2}[-+]?[0-9]*\\.?[0-9]+.{0,2}$";

  public static Pattern NUMERIC_LIKE_PATTERN = Pattern.compile(NUMERIC_LIKE_REGEX);

  public static final String MONEY_LIKE_REGEX = "^[¥￥$]?[0-9]+(\\.[0-9]{1,2})?$";

  public static Pattern MONEY_LIKE_PATTERN = Pattern.compile(MONEY_LIKE_REGEX);

  public static final String CHINESE_PHONE_NUMBER_LIKE_REGEX = "^((13[0-9])|(14[5|7])|(15([0-3]|[5-9]))|(18[0,1,2,5-9])|(177))\\d{8}$";

  public static Pattern CHINESE_PHONE_NUMBER_LIKE_PATTERN = Pattern.compile(CHINESE_PHONE_NUMBER_LIKE_REGEX);

  public static final String IP_PORT_REGEX = "^"
          + "(((?!-)[A-Za-z0-9-]{1,63}(? LongerFirstComparator = (s, s2) -> {
    int result = Integer.compare(s2.length(), s.length());
    if (result == 0)
      return s.compareTo(s2);
    return result;
  };

  public static final Comparator ShorterFirstComparator = (s, s2) -> LongerFirstComparator.compare(s2, s);

  public static final Pattern PatternTime = Pattern.compile("[0-2][0-3]:[0-5][0-9]");

  public static int countTimeString(String text) {
    Matcher matcher = PatternTime.matcher(text);
    int count = 0;
    while (matcher.find())
      count++;
    return count;
  }

  /**
   * Tests if a code point is "whitespace" as defined by what it looks like. Used for Element.text etc.
   *
   * @param c code point to test
   * @return true if code point is whitespace, false otherwise
   */
  public static boolean isActuallyWhitespace(int c) {
    return c == CODE_KEYBOARD_WHITESPACE || c == '\t' || c == '\n' || c == '\f' || c == '\r' || c == CODE_NBSP;
  }

  /**
   * Convenience call for {@link #toHexString(ByteBuffer, String, int)}, where
   * sep = null; lineLen = Integer.MAX_VALUE.
   *
   * @param buf The byte buffer
   * @return The hex string
   */
  public static String toHexString(ByteBuffer buf) {
    return toHexString(buf, null, Integer.MAX_VALUE);
  }

  /**
   * Get a text representation of a ByteBuffer as hexadecimal String, where each
   * pair of hexadecimal digits corresponds to consecutive bytes in the array.
   *
   * @param buf     input data
   * @param sep     separate every pair of hexadecimal digits with this separator, or
   *                null if no separation is needed.
   * @param lineLen break the output String into lines containing output for lineLen
   *                bytes.
   * @return The hex string
   */
  public static String toHexString(ByteBuffer buf, String sep, int lineLen) {
    return toHexString(buf.array(), buf.arrayOffset() + buf.position(), buf.remaining(), sep, lineLen);
  }

  /**
   * Convenience call for {@link #toHexString(byte[], String, int)}, where
   * sep = null; lineLen = Integer.MAX_VALUE.
   *
   * @param buf the buffer
   * @return a {@link java.lang.String} object.
   */
  public static String toHexString(byte[] buf) {
    return toHexString(buf, null, Integer.MAX_VALUE);
  }

  /**
   * Get a text representation of a byte[] as hexadecimal String, where each
   * pair of hexadecimal digits corresponds to consecutive bytes in the array.
   *
   * @param buf     input data
   * @param sep     separate every pair of hexadecimal digits with this separator, or
   *                null if no separation is needed.
   * @param lineLen break the output String into lines containing output for lineLen
   *                bytes.
   * @return a {@link java.lang.String} object.
   */
  public static String toHexString(byte[] buf, String sep, int lineLen) {
    return toHexString(buf, 0, buf.length, sep, lineLen);
  }

  /**
   * Get a text representation of a byte[] as hexadecimal String, where each
   * pair of hexadecimal digits corresponds to consecutive bytes in the array.
   *
   * @param buf     input data
   * @param of      the offset into the byte[] to start reading
   * @param cb      the number of bytes to read from the byte[]
   * @param sep     separate every pair of hexadecimal digits with this separator, or
   *                null if no separation is needed.
   * @param lineLen break the output String into lines containing output for lineLen
   *                bytes.
   * @return a {@link java.lang.String} object.
   */
  public static String toHexString(byte[] buf, int of, int cb, String sep, int lineLen) {
    if (buf == null)
      return null;
    if (lineLen <= 0)
      lineLen = Integer.MAX_VALUE;
    StringBuffer res = new StringBuffer(cb * 2);
    for (int c = 0; c < cb; c++) {
      int b = buf[of++];
      res.append(HEX_DIGITS[(b >> 4) & 0xf]);
      res.append(HEX_DIGITS[b & 0xf]);
      if (c > 0 && (c % lineLen) == 0)
        res.append('\n');
      else if (sep != null && c < lineLen - 1)
        res.append(sep);
    }
    return res.toString();
  }

  // 根据Unicode编码完美的判断中文汉字和符号

  public static boolean isChinese(char c) {
    Character.UnicodeBlock ub = Character.UnicodeBlock.of(c);
    return ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS
            || ub == Character.UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS
            || ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A
            || ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_B
            || ub == Character.UnicodeBlock.CJK_SYMBOLS_AND_PUNCTUATION
            || ub == Character.UnicodeBlock.HALFWIDTH_AND_FULLWIDTH_FORMS
            || ub == Character.UnicodeBlock.GENERAL_PUNCTUATION;

  }

  // 完整的判断中文汉字和符号

  public static boolean isChinese(String text) {
    char[] ch = text.toCharArray();
    for (char c : ch) {
      if (isChinese(c)) {
        return true;
      }
    }

    return false;
  }

  public static boolean isMainlyChinese(String text, double percentage) {
    if ("".equals(text)) return false;

    return 1.0 * countChinese(text) / text.length() >= percentage;
  }

  public static int countChinese(String text) {
    if ("".equals(text)) return 0;

    int count = 0;
    char[] ch = text.toCharArray();
    for (char c : ch) {
      if (isChinese(c)) {
        ++count;
      }
    }

    return count;
  }

  // 只能判断部分CJK字符（CJK统一汉字）

  public static boolean isChineseByREG(String str) {
    if (str == null) {
      return false;
    }

    final Pattern pattern = Pattern.compile("[\\u4E00-\\u9FBF]+");
    return pattern.matcher(str.trim()).find();
  }

  // 只能判断部分CJK字符（CJK统一汉字）
  public static boolean isChineseCharByREG(char ch) {
    return ch >= '\u4E00' && ch <= '\u9FBF';
  }

  // 只能判断部分CJK字符（CJK统一汉字）
  public static boolean isChineseByName(String str) {
    if (str == null) {
      return false;
    }

    // 大小写不同：\\p 表示包含，\\P 表示不包含
    // \\p{Cn} 的意思为 Unicode 中未被定义字符的编码，\\P{Cn} 就表示 Unicode中已经被定义字符的编码
    String reg = "\\p{InCJK Unified Ideographs}&&\\P{Cn}";
    Pattern pattern = Pattern.compile(reg);
    return pattern.matcher(str.trim()).find();
  }

  // 对整个字符串：
  // 1. 仅保留英文字符、数字、汉字字符和keeps中的字符
  // 2. 去除网页空白： 
  //
  // String attrName = "配 送 至：京 东 价：当 当 价";
  // attrName = StringUtils.strip(attrName).replaceAll("[\\s+:：( )]",
  // "");
  // the "blank" characters in the above phrase can not be stripped
  public static String removeNonChar(String text) {
    return removeNonChar(text, null);
  }

  /**
   * @deprecated Use {@link #removeNonChar(String)} instead
   * */
  public static String stripNonChar(String text) {
    return removeNonChar(text);
  }

  /**
   * @deprecated Use {@link #removeNonChar(String, String)} instead
   * */
  public static String stripNonChar(String text, String keeps) {
    return removeNonChar(text, keeps);
  }

  public static String removeNonChar(String text, String keeps) {
    StringBuilder builder = new StringBuilder();

    if (keeps == null) {
      keeps = "";
    }

    for (int i = 0; i < text.length(); ++i) {
      char ch = text.charAt(i);
      if (Character.isLetterOrDigit(ch) || isChineseCharByREG(ch)) {
        builder.append(ch);
      } else if (!keeps.equals("") && keeps.indexOf(ch) != -1) {
        builder.append(ch);
      }
    }

    return builder.toString();
  }

  public static String trimNonChar(String text) {
    return trimNonChar(text, null);
  }

  /**
   // 对字符串的头部和尾部：
   // 1. 仅保留英文字符、数字、汉字字符和keeps中的字符
   // 2. 去除网页空白： 
   */
  public static String trimNonChar(String text, String keeps) {
    int start = 0;
    int end = text.length();
    if (keeps == null)
      keeps = "";

    for (int i = 0; i < text.length(); ++i) {
      char ch = text.charAt(i);
      if (Character.isLetterOrDigit(ch) || isChineseCharByREG(ch)
              || keeps.indexOf(ch) != -1) {
        start = i;
        break;
      }
    }

    for (int i = text.length() - 1; i >= 0; --i) {
      char ch = text.charAt(i);
      if (Character.isLetterOrDigit(ch) || isChineseCharByREG(ch)
              || keeps.indexOf(ch) != -1) {
        end = i + 1;
        break;
      }
    }

    return text.substring(start, end);
  }

  public static boolean isCJK(char ch) {
    return Character.UnicodeBlock.of(ch) == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS;
  }

  /**
   * 对整个字符串：
   * 1. 仅保留英文字符、数字、汉字字符和 keeps 中的字符
   * 2. 去除网页空白： 
   * String attrName = "配 送 至：京 东 价：当 当 价";
   * attrName = StringUtils.strip(attrName).replaceAll("[\\s+:：( )]", "");
   * the "blank" characters in the above phrase can not be removed
   */
  public static String removeNonCJKChar(String text) {
    return removeNonCJKChar(text, null);
  }

  public static String removeNonCJKChar(String text, String keeps) {
    StringBuilder builder = new StringBuilder();

    if (keeps == null) {
      keeps = "";
    }

    for (int i = 0; i < text.length(); ++i) {
      char ch = text.charAt(i);
      if (Character.isLetterOrDigit(ch) || isCJK(ch)) {
        builder.append(ch);
      } else if (!keeps.isEmpty() && keeps.indexOf(ch) != -1) {
        builder.append(ch);
      }
    }

    return builder.toString();
  }

  public static String trimNonCJKChar(String text) {
    return trimNonCJKChar(text, null);
  }


  /**
   * 对字符串的头部和尾部：
   * 1. 仅保留英文字符、数字、汉字字符和keeps中的字符
   * 2. 去除网页空白： 
   */
  public static String trimNonCJKChar(String text, String keeps) {
    int start = 0;
    int end = text.length();
    if (keeps == null)
      keeps = "";

    for (int i = 0; i < text.length(); ++i) {
      char ch = text.charAt(i);
      if (Character.isLetterOrDigit(ch) || isCJK(ch) || keeps.indexOf(ch) != -1) {
        start = i;
        break;
      }
    }

    for (int i = text.length() - 1; i >= 0; --i) {
      char ch = text.charAt(i);
      if (Character.isLetterOrDigit(ch) || isCJK(ch) || keeps.indexOf(ch) != -1) {
        end = i + 1;
        break;
      }
    }

    return text.substring(start, end);
  }

  /**
   * Strip non-printable characters from a string.
   *
   * @param s the string to strip.
   * @return a new string with non-printable characters removed.
   */
  public static String removeNonPrintableChar(String s) {
    if (s == null) {
      return null;
    }

    StringBuilder builder = new StringBuilder();

    int len = s.length();
    for (int i = 0; i < len; ++i) {
      char ch = s.charAt(i);
      if (isActuallyWhitespace(ch)) {
        if (i > 0 && i < len - 1) {
          builder.append(' ');
        }
        int j = i + 1;
        while (j < len && isActuallyWhitespace(s.charAt(j))) {
          ++j;
        }
        i = j - 1;
      } else if (isPrintableUnicodeChar(ch)) {
        builder.append(ch);
      }
    }

    return builder.toString();
  }

  /**
   * @deprecated use {@link #removeNonPrintableChar(String)} instead.
   */
  public static String stripNonPrintableChar1(String s) {
    return removeNonPrintableChar(s);
  }

  public static boolean isPrintableUnicodeChar(char ch) {
    Character.UnicodeBlock block = Character.UnicodeBlock.of(ch);
    return (!Character.isISOControl(ch)) && ch != KeyEvent.CHAR_UNDEFINED
            && block != null && block != Character.UnicodeBlock.SPECIALS;
  }

  public static String removeControlChars(String input) {
    return clearControlChars(input, "");
  }

  public static String clearControlChars(String input) {
    return clearControlChars(input, " ");
  }

  public static String clearControlChars(String input, String replacement) {
    if (input == null) {
      return null;
    }

    return input.replaceAll("\\p{Cntrl}", replacement);
  }

  public static String getLongestPart(final String text, final Pattern pattern) {
    String[] parts = pattern.split(text);

    if (parts.length == 1) {
      return "";
    }

    String longestPart = "";
    for (String p : parts) {
      if (p.length() > longestPart.length()) {
        longestPart = p;
      }
    }

    if (longestPart.isEmpty()) {
      return "";
    } else {
      return longestPart.trim();
    }
  }

  public static String getLongestPart(final String text, final String regex) {
    return getLongestPart(text, Pattern.compile(regex));
  }

  /**
   * See CaseFormat from Guava, for example, LOWER_UNDERSCORE.to(LOWER_CAMEL, str)
   */
  public static String csslize(String text) {
    text = StringUtils.uncapitalize(text).trim();
    text = StringUtils.join(text.split("(?=\\p{Upper})"), "-").toLowerCase();
    text = text.replaceAll("[-_]+", "-");
    text = text.replaceAll("\\s+", "-");

    return text;
  }

  /**
   * See CaseFormat from Guava, for example, LOWER_UNDERSCORE.to(LOWER_CAMEL, str)
   */
  public static String humanize(String text) {
    text = StringUtils.join(text.split("(?=\\p{Upper})"), " ");
    text = text.replaceAll("[-_]", " ").toLowerCase().trim();

    return text;
  }

  /**
   * See CaseFormat from Guava, for example, LOWER_UNDERSCORE.to(LOWER_CAMEL, str)
   */
  public static String humanize(String text, String seperator) {
    text = StringUtils.join(text.split("(?=\\p{Upper})"), seperator);
    text = text.replaceAll("[-_]", seperator).toLowerCase().trim();

    return text;
  }

  /**
   * See CaseFormat from Guava, for example, LOWER_UNDERSCORE.to(LOWER_CAMEL, str)
   */
  public static String humanize(String text, String suffix, String seperator) {
    text = StringUtils.join(text.split("(?=\\p{Upper})"), seperator);
    text = text.replaceAll("[-_]", seperator).toLowerCase().trim();

    return text + seperator + suffix;
  }

  /**
   * See CaseFormat from Guava, for example, LOWER_UNDERSCORE.to(LOWER_CAMEL, str)
   */
  public static String humanize(Class clazz, String suffix, String seperator) {
    String text = StringUtils.join(clazz.getSimpleName().split("(?=\\p{Upper})"), seperator);
    text = text.replaceAll("[-_]", seperator).toLowerCase().trim();

    return text + seperator + suffix;
  }

  public static int getLeadingInteger(String s, int defaultValue) {
    int numberEnd = StringUtils.lastIndexOfAny(s, "123456789");
    if (numberEnd == StringUtils.INDEX_NOT_FOUND) {
      return defaultValue;
    }
    return NumberUtils.toInt(s.substring(0, numberEnd), defaultValue);
  }

  public static int getTailingInteger(String s, int defaultValue) {
    int numberStart = StringUtils.indexOfAny(s, "123456789");
    if (numberStart == StringUtils.INDEX_NOT_FOUND) {
      return defaultValue;
    }
    return NumberUtils.toInt(s.substring(numberStart), defaultValue);
  }


  public static int getFirstInteger(String s, int defaultValue) {
    var number = getFirstInteger(s);
    return number == null ? defaultValue : number;
  }

  /**
   * @deprecated use {@link #findFirstInteger(String)} instead
   * */
  public static Integer getFirstInteger(String s) {
    return findFirstInteger(s);
  }

  /**
   * Find the first integer in the string.
   *
   * @return the first integer in the string, or null if not found
   * */
  public static Integer findFirstInteger(String s) {
    if (s == null) {
      return null;
    }

    int numberStart = StringUtils.indexOfAny(s, "123456789");
    if (numberStart == StringUtils.INDEX_NOT_FOUND) {
      return null;
    }

    StringBuilder sb = new StringBuilder(s.length() - numberStart);
    for (int i = numberStart; i < s.length(); ++i) {
      char c = s.charAt(i);
      if (Character.isDigit(c)) {
        sb.append(c);
      } else if (c == ',' || c == '_') {
        // skip number delimiter, 12,345,678 or java style 12_345_678
        // nothing to do
      } else {
        break;
      }
    }

    return Integer.parseInt(sb.toString());
  }

  public static int findFirstInteger(String s, int defaultValue) {
    return getFirstInteger(s, defaultValue);
  }

  /**
   * @deprecated use {@link #findLastInteger(String)} instead
   * */
  public static int getLastInteger(String s, int defaultValue) {
    return findLastInteger(s, defaultValue);
  }

  /**
   * Find the last integer in the string.
   *
   * @return the last integer in the string, or null if not found
   * */
  public static Integer findLastInteger(String s) {
    if (s == null) {
      return null;
    }

    s = s.replaceAll("[,_]", "");
    s = StringUtils.reverse(s);
    Pattern pattern = Pattern.compile("[0-9]+");

    Matcher m = pattern.matcher(s);
    if (m.find()) {
      return NumberUtils.toInt(StringUtils.reverse(m.group()));
    }

    return null;
  }

  public static int findLastInteger(String s, int defaultValue) {
    Integer number = findLastInteger(s);
    return number == null ? defaultValue : number;
  }

  public static float getFirstFloatNumber(String s, float defaultValue) {
    System.out.println(s);

    // number separators
    s = s.replaceAll("[,_]", "");
    Pattern pattern = Pattern.compile("[+-]?[0-9]*\\.?,?[0-9]+");

    Matcher m = pattern.matcher(s);
    if (m.find()) {

      System.out.println(m.group());

      return NumberUtils.toFloat(m.group());
    }

    return defaultValue;
  }

  public static float findLastFloatNumber(String s, float defaultValue) {
    s = s.replaceAll("[,_]", "");
    Pattern pattern = Pattern.compile("[+-]?[0-9]*\\.?,?[0-9]+");

    Matcher m = pattern.matcher(s);
    if (m.find()) {
      return NumberUtils.toFloat(m.group(m.groupCount()));
    }

    return defaultValue;
  }

  public static boolean contains(String text, CharSequence... searchCharSequences) {
    Validate.notNull(searchCharSequences);

    for (CharSequence search : searchCharSequences) {
      if (!text.contains(search)) return false;
    }

    return true;
  }

  public static boolean containsAny(String text, CharSequence... searchCharSequences) {
    Validate.notNull(searchCharSequences);

    for (CharSequence search : searchCharSequences) {
      if (text.contains(search)) return true;
    }

    return false;
  }

  public static boolean containsNone(String text, CharSequence... searchCharSequences) {
    Validate.notNull(searchCharSequences);

    for (CharSequence search : searchCharSequences) {
      if (text.contains(search)) return false;
    }

    return true;
  }

  public static String reverse(String s) {
    if (s == null || s.isEmpty()) {
      return s;
    }

    StringBuilder sb = new StringBuilder(s);
    return sb.reverse().toString();
  }

  public static String doubleQuoteIfContainsWhitespace(String s) {
    if (StringUtils.containsWhitespace(s)) return "\"" + s + "\"";
    else return s;
  }

  /**
   * Formats a decimal number in its compact, readable form.
   *
   * @see 
   * CompactNumberFormat
   */
  public static String compactFormat(int number) {
    return compactFormat(number, -1, false);
  }

  /**
   * Formats a decimal number in its compact, readable form.
   *
   * @see 
   * CompactNumberFormat
   */
  public static String compactFormat(long number) {
    return compactFormat(number, -1, false);
  }

  /**
   * Formats a decimal number in its compact, readable form.
   *
   * @see 
   * CompactNumberFormat
   */
  public static String compactFormat(int number, boolean si) {
    return compactFormat(number, -1, si);
  }

  /**
   * Formats a decimal number in its compact, readable form.
   *
   * @see 
   * CompactNumberFormat
   */
  public static String compactFormat(long number, boolean si) {
    return compactFormat(number, -1, si);
  }

  /**
   * Formats a decimal number in its compact, readable form.
   *
   * @see 
   * CompactNumberFormat
   */
  public static String compactFormat(int number, int scale, boolean si) {
    return compactFormat((long) number, scale, si);
  }

  /**
   * Formats a decimal number in its compact, readable form.
   *
   * @param number the number to format
   * @param scale  the scale of the format result
   * @param si     indicate if format to a SI unit
   *               The International System Of Units (SI) is the metric system that is used
   *               universally as a standard for measurements. SI units play a vital role in scientific
   *               and technological research and development.
   * @return The formatted number
   * @see 
   * CompactNumberFormat
   */
  public static String compactFormat(long number, int scale, boolean si) {
    if (number < 0) {
      return "-" + compactFormat(-number, scale, si);
    }

    int unit = si ? 1000 : 1024;
    if (number < unit) {
      return number + " B";
    }

    int exp = (int) (Math.log(number) / Math.log(unit));
    String pre = (si ? "kMGTPE" : "KMGTPE").charAt(exp - 1) + (si ? "" : "i");
    String format = scale > 0 ? "%," + scale + ".2f %sB" : "%,.2f %sB";
    return String.format(format, number / Math.pow(unit, exp), pre);
  }

  /**
   * Parse key-value pairs in a line, for example :
   * "a=1 b=2 c=3", "x:1 y:2 z:3"
   *
   * @param line The line to parse
   * @return The parsed result
   */
  public static Map parseKvs(String line) {
    return parseKvs(line, "=");
  }

  /**
   * Parse key-value pairs in a line, for example :
   * "a=1 b=2 c=3", "x:1 y:2 z:3"
   *
   * @param line      The line to parse
   * @param delimiter a {@link java.lang.String} object.
   * @return The parsed result
   */
  public static Map parseKvs(String line, String delimiter) {
    return SParser.wrap(line).getKvs(delimiter);
  }

  /**
   * All lines separated by backslashes are merged together
   *
   * @param allLines All lines separated by "\n", some of them are separated by  back slash
   * @return All lines separated by backslashes are merged
   */
  public static List getUnslashedLines(String allLines) {
    return mergeSlashedLines(Arrays.asList(allLines.split("\n")));
  }

  /**
   * 
getUnslashedLines.
   *
   * @param allLines a {@link java.lang.String} object.
   * @param EOL      a {@link java.lang.String} object.
   * @return a {@link java.util.List} object.
   */
  public static List getUnslashedLines(String allLines, String EOL) {
    return mergeSlashedLines(Arrays.asList(allLines.split(EOL)));
  }

  /**
   * Merge lines concatenated with backslash, for example :
   * The line "Java Stream API is very, very useful, \\\n"
   * " and we use them everywhere "
   * can be merged into "Java Stream API is very, very useful, and we use them everywhere"
   *
   * @param slashedLine a {@link java.lang.String} object.
   * @return a {@link java.lang.String} object.
   */
  public static String mergeSlashedLine(String slashedLine) {
    slashedLine = slashedLine.replaceAll("\n", "");
    slashedLine = slashedLine.replaceAll("\\\\", "");
    return slashedLine;
  }

  /**
   * All lines separated by back slashes are merged together
   *
   * @param linesWithSlash Lines with back slash
   * @return All lines separated by back slashes are merged
   */
  public static List mergeSlashedLines(Iterable linesWithSlash) {
    List lines = new ArrayList<>();
    StringBuilder mergedLine = new StringBuilder();
    boolean merging;
    for (String line : linesWithSlash) {
      line = line.trim();

      if (line.isEmpty()) {
        continue;
      }

      if (line.endsWith("\\")) {
        merging = true;
        mergedLine.append(StringUtils.removeEnd(line, "\\"));
      } else {
        mergedLine.append(line);
        merging = false;
      }

      if (!merging) {
        if (mergedLine.length() > 0) {
          lines.add(mergedLine.toString());
          mergedLine = new StringBuilder();
        }
      }
    }

    return lines;
  }

  public static int getLongestCommonSubstring(String a, String b) {
    int m = a.length();
    int n = b.length();

    int max = 0;

    int[][] dp = new int[m][n];

    for (int i = 0; i < m; i++) {
      for (int j = 0; j < n; j++) {
        if (a.charAt(i) == b.charAt(j)) {
          if (i == 0 || j == 0) {
            dp[i][j] = 1;
          } else {
            dp[i][j] = dp[i - 1][j - 1] + 1;
          }

          if (max < dp[i][j])
            max = dp[i][j];
        }

      }
    }

    return max;
  }

  public static String replaceCharsetInHtml(String html, String charset) {
    Matcher matcher = HTML_CHARSET_PATTERN.matcher(html);
    if (matcher.find()) {
      html = html.replaceAll(matcher.group(1), charset);
    }

    return html;
  }

  public static String[] getStrings(String str) {
    Collection values = getStringCollection(str);
    if (values.size() == 0) {
      return null;
    }
    return values.toArray(new String[0]);
  }

  public static String arrayToString(String[] strs) {
    if (strs.length == 0) {
      return "";
    }
    StringBuilder sbuf = new StringBuilder();
    sbuf.append(strs[0]);
    for (int idx = 1; idx < strs.length; idx++) {
      sbuf.append(",");
      sbuf.append(strs[idx]);
    }
    return sbuf.toString();
  }

  public static Collection getStringCollection(String str) {
    String delim = ",";
    return getStringCollection(str, delim);
  }

  public static Collection getStringCollection(String str, String delim) {
    List values = new ArrayList();
    if (str == null)
      return values;
    StringTokenizer tokenizer = new StringTokenizer(str, delim);
    while (tokenizer.hasMoreTokens()) {
      values.add(tokenizer.nextToken());
    }
    return values;
  }

  /**
   * Splits a comma separated value String, trimming leading and trailing whitespace on each value.
   * Duplicate and empty values are removed.
   *
   * @param str a comma separated string with values
   * @return a Collection of String values
   */
  public static Collection getTrimmedStringCollection(String str) {
    Set set = new LinkedHashSet(Arrays.asList(getTrimmedStrings(str)));
    set.remove("");
    return set;
  }

  /**
   * Splits a comma separated value String, trimming leading and trailing whitespace on each value.
   *
   * @param str a comma separated String with values
   * @return an array of String values
   */
  public static String[] getTrimmedStrings(String str) {
    if (null == str || str.trim().isEmpty()) {
      return emptyStringArray;
    }

    return str.trim().split("\\s*,\\s*");
  }

  public static boolean hasHTMLTags(String text) {
    Matcher matcher = HTML_TAG_PATTERN.matcher(text);
    return matcher.find();
  }

  public static boolean isFloat(String text) {
    return FLOAT_PATTERN.matcher(text).matches();
  }

  public static boolean isNumericLike(String text) {
    return NUMERIC_LIKE_PATTERN.matcher(text).matches();
  }

  /**
   * regextester
   *
   * @param text a {@link String} object.
   * @return a boolean.
   */
  public static boolean isMoneyLike(String text) {
    return MONEY_LIKE_PATTERN.matcher(text).matches();
  }

  /**
   * isIpPortLike.
   *
   * @param text a {@link java.lang.String} object.
   * @return a boolean.
   */
  public static boolean isIpPortLike(String text) {
    return IP_PORT_PATTERN.matcher(text).matches();
  }

  /**
   * isIpLike.
   *
   * @param text a {@link java.lang.String} object.
   * @return a boolean.
   */
  public static boolean isIpLike(String text) {
    return isIpV4Like(text);
  }

  public static boolean isIpV4Like(String text) {
    return text.matches("\\d{1,3}\\.\\d{1,3}\\.\\d{1,3}\\.\\d{1,3}");
  }
}