All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.thinkbiganalytics.metadata.jpa.support.NormalizeAndCleanString Maven / Gradle / Ivy

package com.thinkbiganalytics.metadata.jpa.support;

/*-
 * #%L
 * thinkbig-operational-metadata-jpa
 * %%
 * Copyright (C) 2017 ThinkBig Analytics
 * %%
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 * #L%
 */

import org.apache.commons.lang3.StringUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.nio.charset.Charset;
import java.text.Normalizer;

/**
 * MySQL doesnt like unicode strings, and other chars.
 * This will normalize the string and strip the bad chars
 */
public class NormalizeAndCleanString {
    private static final Logger log = LoggerFactory.getLogger(NormalizeAndCleanString.class);


    public static String normalizeAndClean(String str){
        try {
            if(StringUtils.isNotBlank(str)) {
                String testStr = Normalizer.normalize(str, Normalizer.Form.NFD);
                String clean = testStr.replaceAll("\\P{InBasic_Latin}", "");
                return clean;
            }
        }catch (Exception e){
            log.error("Unable to replace non UTF-8 characters for {}. {} ",str,e.getMessage(),e);
        }
        return null;
    }





}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy