All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.solr.common.util.StrUtils Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.solr.common.util;

import java.util.List;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Locale;
import java.io.IOException;

import org.apache.solr.common.SolrException;

/**
 *
 */
public class StrUtils {
  public static final char[] HEX_DIGITS = { '0', '1', '2', '3', '4', '5', '6',
      '7', '8', '9', 'a', 'b', 'c', 'd', 'e', 'f' };

  /**
   * Split a string based on a separator, but don't split if it's inside
   * a string.  Assume '\' escapes the next char both inside and
   * outside strings.
   */
  public static List splitSmart(String s, char separator) {
    ArrayList lst = new ArrayList(4);
    int pos=0, start=0, end=s.length();
    char inString=0;
    char ch=0;
    while (pos < end) {
      char prevChar=ch;
      ch = s.charAt(pos++);
      if (ch=='\\') {    // skip escaped chars
        pos++;
      } else if (inString != 0 && ch==inString) {
        inString=0;
      } else if (ch=='\'' || ch=='"') {
        // If char is directly preceeded by a number or letter
        // then don't treat it as the start of a string.
        // Examples: 50" TV, or can't
        if (!Character.isLetterOrDigit(prevChar)) {
          inString=ch;
        }
      } else if (ch==separator && inString==0) {
        lst.add(s.substring(start,pos-1));
        start=pos;
      }
    }
    if (start < end) {
      lst.add(s.substring(start,end));
    }

    /***
    if (SolrCore.log.isLoggable(Level.FINEST)) {
      SolrCore.log.trace("splitCommand=" + lst);
    }
    ***/

    return lst;
  }

  /** Splits a backslash escaped string on the separator.
   * 

* Current backslash escaping supported: *
\n \t \r \b \f are escaped the same as a Java String *
Other characters following a backslash are produced verbatim (\c => c) * * @param s the string to split * @param separator the separator to split on * @param decode decode backslash escaping */ public static List splitSmart(String s, String separator, boolean decode) { ArrayList lst = new ArrayList(2); StringBuilder sb = new StringBuilder(); int pos=0, end=s.length(); while (pos < end) { if (s.startsWith(separator,pos)) { if (sb.length() > 0) { lst.add(sb.toString()); sb=new StringBuilder(); } pos+=separator.length(); continue; } char ch = s.charAt(pos++); if (ch=='\\') { if (!decode) sb.append(ch); if (pos>=end) break; // ERROR, or let it go? ch = s.charAt(pos++); if (decode) { switch(ch) { case 'n' : ch='\n'; break; case 't' : ch='\t'; break; case 'r' : ch='\r'; break; case 'b' : ch='\b'; break; case 'f' : ch='\f'; break; } } } sb.append(ch); } if (sb.length() > 0) { lst.add(sb.toString()); } return lst; } /** * Splits file names separated by comma character. * File names can contain comma characters escaped by backslash '\' * * @param fileNames the string containing file names * @return a list of file names with the escaping backslashed removed */ public static List splitFileNames(String fileNames) { if (fileNames == null) return Collections.emptyList(); List result = new ArrayList(); for (String file : fileNames.split("(? items, char separator) { StringBuilder sb = new StringBuilder(items.size() << 3); boolean first=true; for (Object o : items) { String item = o.toString(); if (first) { first = false; } else { sb.append(separator); } for (int i=0; i splitWS(String s, boolean decode) { ArrayList lst = new ArrayList(2); StringBuilder sb = new StringBuilder(); int pos=0, end=s.length(); while (pos < end) { char ch = s.charAt(pos++); if (Character.isWhitespace(ch)) { if (sb.length() > 0) { lst.add(sb.toString()); sb=new StringBuilder(); } continue; } if (ch=='\\') { if (!decode) sb.append(ch); if (pos>=end) break; // ERROR, or let it go? ch = s.charAt(pos++); if (decode) { switch(ch) { case 'n' : ch='\n'; break; case 't' : ch='\t'; break; case 'r' : ch='\r'; break; case 'b' : ch='\b'; break; case 'f' : ch='\f'; break; } } } sb.append(ch); } if (sb.length() > 0) { lst.add(sb.toString()); } return lst; } public static List toLower(List strings) { ArrayList ret = new ArrayList(strings.size()); for (String str : strings) { ret.add(str.toLowerCase(Locale.ROOT)); } return ret; } /** Return if a string starts with '1', 't', or 'T' * and return false otherwise. */ public static boolean parseBoolean(String s) { char ch = s.length()>0 ? s.charAt(0) : 0; return (ch=='1' || ch=='t' || ch=='T'); } /** how to transform a String into a boolean... more flexible than * Boolean.parseBoolean() to enable easier integration with html forms. */ public static boolean parseBool(String s) { if( s != null ) { if( s.startsWith("true") || s.startsWith("on") || s.startsWith("yes") ) { return true; } if( s.startsWith("false") || s.startsWith("off") || s.equals("no") ) { return false; } } throw new SolrException( SolrException.ErrorCode.BAD_REQUEST, "invalid boolean value: "+s ); } /** * {@link NullPointerException} and {@link SolrException} free version of {@link #parseBool(String)} * @return parsed boolean value (or def, if s is null or invalid) */ public static boolean parseBool(String s, boolean def) { if( s != null ) { if( s.startsWith("true") || s.startsWith("on") || s.startsWith("yes") ) { return true; } if( s.startsWith("false") || s.startsWith("off") || s.equals("no") ) { return false; } } return def; } /** * URLEncodes a value, replacing only enough chars so that * the URL may be unambiguously pasted back into a browser. *

* Characters with a numeric value less than 32 are encoded. * &,=,%,+,space are encoded. *

*/ public static void partialURLEncodeVal(Appendable dest, String val) throws IOException { for (int i=0; i





© 2015 - 2025 Weber Informatics LLC | Privacy Policy