All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.taobao.diamond.utils.UrlAnalysisUtils Maven / Gradle / Ivy

There is a newer version: 3.2.4
Show newest version
package com.taobao.diamond.utils;

import java.util.regex.Matcher;
import java.util.regex.Pattern;

import com.taobao.diamond.common.Constants;


/**
 * 
 * @author leiwen.zh
 * 
 */
public class UrlAnalysisUtils {

    private static Pattern urlPattern = Pattern.compile("^(\\w+://)?([\\w\\.]+:)(\\d*)?(\\??.*)");


    public static String getContentIdentity(String content) {

        if (!verifyIncrementPubContent(content)) {
            return null;
        }

        Matcher matcher = urlPattern.matcher(content);
        StringBuilder buf = new StringBuilder();
        if (matcher.find()) {
            String scheme = matcher.group(1);
            String address = matcher.group(2);
            String port = matcher.group(3);
            if (scheme != null) {
                buf.append(scheme);
            }
            buf.append(address);
            if (port != null) {
                buf.append(port);
            }
        }
        return buf.toString();
    }


    private static boolean verifyIncrementPubContent(String content) {

        if (content == null || content.length() == 0) {
            return false;
        }
        for (int i = 0; i < content.length(); i++) {
            char c = content.charAt(i);
            if (c == '\r' || c == '\n') {
                return false;
            }
            if (c == Constants.WORD_SEPARATOR.charAt(0)) {
                return false;
            }
        }
        return true;
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy