All downloads are free. Search and download features use the official Maven repository.

cn.geektool.core.util.HashUtil Maven / Gradle / Ivy

package cn.geektool.core.util;

import cn.geektool.core.lang.hash.CityHash;
import cn.geektool.core.lang.hash.MurmurHash;
import cn.geektool.core.lang.hash.Number128;

/**
 * Hash算法大全
* 推荐使用FNV1算法 * * @author Goodzzp, Looly */ public class HashUtil { /** * 加法hash * * @param key 字符串 * @param prime 一个质数 * @return hash结果 */ public static int additiveHash(String key, int prime) { int hash, i; for (hash = key.length(), i = 0; i < key.length(); i++) { hash += key.charAt(i); } return hash % prime; } /** * 旋转hash * * @param key 输入字符串 * @param prime 质数 * @return hash值 */ public static int rotatingHash(String key, int prime) { int hash, i; for (hash = key.length(), i = 0; i < key.length(); ++i) { hash = (hash << 4) ^ (hash >> 28) ^ key.charAt(i); } // 使用:hash = (hash ^ (hash>>10) ^ (hash>>20)) & mask; // 替代:hash %= prime; // return (hash ^ (hash>>10) ^ (hash>>20)); return hash % prime; } /** * 一次一个hash * * @param key 输入字符串 * @return 输出hash值 */ public static int oneByOneHash(String key) { int hash, i; for (hash = 0, i = 0; i < key.length(); ++i) { hash += key.charAt(i); hash += (hash << 10); hash ^= (hash >> 6); } hash += (hash << 3); hash ^= (hash >> 11); hash += (hash << 15); // return (hash & M_MASK); return hash; } /** * Bernstein's hash * * @param key 输入字节数组 * @return 结果hash */ public static int bernstein(String key) { int hash = 0; int i; for (i = 0; i < key.length(); ++i) { hash = 33 * hash + key.charAt(i); } return hash; } /** * Universal Hashing * * @param key 字节数组 * @param mask 掩码 * @param tab tab * @return hash值 */ public static int universal(char[] key, int mask, int[] tab) { int hash = key.length, i, len = key.length; for (i = 0; i < (len << 3); i += 8) { char k = key[i >> 3]; if ((k & 0x01) == 0) { hash ^= tab[i]; } if ((k & 0x02) == 0) { hash ^= tab[i + 1]; } if ((k & 0x04) == 0) { hash ^= tab[i + 2]; } if ((k & 0x08) == 0) { hash ^= tab[i + 3]; } if ((k & 0x10) == 0) { hash ^= tab[i + 4]; } if ((k & 0x20) == 0) { hash ^= tab[i + 5]; } if ((k & 0x40) == 0) { hash ^= tab[i + 6]; } if ((k & 0x80) == 0) { hash ^= tab[i + 7]; } } return (hash & mask); } /** * Zobrist Hashing * * @param key 字节数组 * @param mask 掩码 * @param tab tab * @return hash值 
*/ public static int zobrist(char[] key, int mask, int[][] tab) { int hash, i; for (hash = key.length, i = 0; i < key.length; ++i) { hash ^= tab[i][key[i]]; } return (hash & mask); } /** * 改进的32位FNV算法1 * * @param data 数组 * @return hash结果 */ public static int fnvHash(byte[] data) { final int p = 16777619; int hash = (int) 2166136261L; for (byte b : data) { hash = (hash ^ b) * p; } hash += hash << 13; hash ^= hash >> 7; hash += hash << 3; hash ^= hash >> 17; hash += hash << 5; return Math.abs(hash); } /** * 改进的32位FNV算法1 * * @param data 字符串 * @return hash结果 */ public static int fnvHash(String data) { final int p = 16777619; int hash = (int) 2166136261L; for (int i = 0; i < data.length(); i++) { hash = (hash ^ data.charAt(i)) * p; } hash += hash << 13; hash ^= hash >> 7; hash += hash << 3; hash ^= hash >> 17; hash += hash << 5; return Math.abs(hash); } /** * Thomas Wang的算法,整数hash * * @param key 整数 * @return hash值 */ public static int intHash(int key) { key += ~(key << 15); key ^= (key >>> 10); key += (key << 3); key ^= (key >>> 6); key += ~(key << 11); key ^= (key >>> 16); return key; } /** * RS算法hash * * @param str 字符串 * @return hash值 */ public static int rsHash(String str) { int b = 378551; int a = 63689; int hash = 0; for (int i = 0; i < str.length(); i++) { hash = hash * a + str.charAt(i); a = a * b; } return hash & 0x7FFFFFFF; } /** * JS算法 * * @param str 字符串 * @return hash值 */ public static int jsHash(String str) { int hash = 1315423911; for (int i = 0; i < str.length(); i++) { hash ^= ((hash << 5) + str.charAt(i) + (hash >> 2)); } return hash & 0x7FFFFFFF; } /** * PJW算法 * * @param str 字符串 * @return hash值 */ public static int pjwHash(String str) { int bitsInUnsignedInt = 32; int threeQuarters = (bitsInUnsignedInt * 3) / 4; int oneEighth = bitsInUnsignedInt / 8; int highBits = 0xFFFFFFFF << (bitsInUnsignedInt - oneEighth); int hash = 0; int test; for (int i = 0; i < str.length(); i++) { hash = (hash << oneEighth) + str.charAt(i); if ((test = hash & highBits) != 0) 
{ hash = ((hash ^ (test >> threeQuarters)) & (~highBits)); } } return hash & 0x7FFFFFFF; } /** * ELF算法 * * @param str 字符串 * @return hash值 */ public static int elfHash(String str) { int hash = 0; int x; for (int i = 0; i < str.length(); i++) { hash = (hash << 4) + str.charAt(i); if ((x = (int) (hash & 0xF0000000L)) != 0) { hash ^= (x >> 24); hash &= ~x; } } return hash & 0x7FFFFFFF; } /** * BKDR算法 * * @param str 字符串 * @return hash值 */ public static int bkdrHash(String str) { int seed = 131; // 31 131 1313 13131 131313 etc.. int hash = 0; for (int i = 0; i < str.length(); i++) { hash = (hash * seed) + str.charAt(i); } return hash & 0x7FFFFFFF; } /** * SDBM算法 * * @param str 字符串 * @return hash值 */ public static int sdbmHash(String str) { int hash = 0; for (int i = 0; i < str.length(); i++) { hash = str.charAt(i) + (hash << 6) + (hash << 16) - hash; } return hash & 0x7FFFFFFF; } /** * DJB算法 * * @param str 字符串 * @return hash值 */ public static int djbHash(String str) { int hash = 5381; for (int i = 0; i < str.length(); i++) { hash = ((hash << 5) + hash) + str.charAt(i); } return hash & 0x7FFFFFFF; } /** * DEK算法 * * @param str 字符串 * @return hash值 */ public static int dekHash(String str) { int hash = str.length(); for (int i = 0; i < str.length(); i++) { hash = ((hash << 5) ^ (hash >> 27)) ^ str.charAt(i); } return hash & 0x7FFFFFFF; } /** * AP算法 * * @param str 字符串 * @return hash值 */ public static int apHash(String str) { int hash = 0; for (int i = 0; i < str.length(); i++) { hash ^= ((i & 1) == 0) ? 
((hash << 7) ^ str.charAt(i) ^ (hash >> 3)) : (~((hash << 11) ^ str.charAt(i) ^ (hash >> 5))); } // return (hash & 0x7FFFFFFF); return hash; } /** * TianL Hash算法 * * @param str 字符串 * @return Hash值 */ public static long tianlHash(String str) { long hash; int iLength = str.length(); if (iLength == 0) { return 0; } if (iLength <= 256) { hash = 16777216L * (iLength - 1); } else { hash = 4278190080L; } int i; char ucChar; if (iLength <= 96) { for (i = 1; i <= iLength; i++) { ucChar = str.charAt(i - 1); if (ucChar <= 'Z' && ucChar >= 'A') { ucChar = (char) (ucChar + 32); } hash += (3 * i * ucChar * ucChar + 5 * i * ucChar + 7 * i + 11 * ucChar) % 16777216; } } else { for (i = 1; i <= 96; i++) { ucChar = str.charAt(i + iLength - 96 - 1); if (ucChar <= 'Z' && ucChar >= 'A') { ucChar = (char) (ucChar + 32); } hash += (3 * i * ucChar * ucChar + 5 * i * ucChar + 7 * i + 11 * ucChar) % 16777216; } } if (hash < 0) { hash *= -1; } return hash; } /** * JAVA自己带的算法 * * @param str 字符串 * @return hash值 */ public static int javaDefaultHash(String str) { int h = 0; int off = 0; int len = str.length(); for (int i = 0; i < len; i++) { h = 31 * h + str.charAt(off++); } return h; } /** * 混合hash算法,输出64位的值 * * @param str 字符串 * @return hash值 */ public static long mixHash(String str) { long hash = str.hashCode(); hash <<= 32; hash |= fnvHash(str); return hash; } /** * 根据对象的内存地址生成相应的Hash值 * * @param obj 对象 * @return hash值 * @since 4.2.2 */ public static int identityHashCode(Object obj) { return System.identityHashCode(obj); } /** * MurmurHash算法32-bit实现 * * @param data 数据 * @return hash值 * @since 4.3.3 */ public static int murmur32(byte[] data) { return MurmurHash.hash32(data); } /** * MurmurHash算法64-bit实现 * * @param data 数据 * @return hash值 * @since 4.3.3 */ public static long murmur64(byte[] data) { return MurmurHash.hash64(data); } /** * MurmurHash算法128-bit实现 * * @param data 数据 * @return hash值 * @since 4.3.3 */ public static long[] murmur128(byte[] data) { return MurmurHash.hash128(data); } /** 
* CityHash算法32-bit实现 * * @param data 数据 * @return hash值 * @since 5.2.5 */ public static int cityHash32(byte[] data) { return CityHash.hash32(data); } /** * CityHash算法64-bit实现,种子1使用默认的CityHash#k2 * * @param data 数据 * @param seed 种子2 * @return hash值 * @since 5.2.5 */ public static long cityHash64(byte[] data, long seed) { return CityHash.hash64(data, seed); } /** * CityHash算法64-bit实现,种子1使用默认的CityHash#k2 * * @param data 数据 * @param seed0 种子1 * @param seed1 种子2 * @return hash值 * @since 5.2.5 */ public static long cityHash64(byte[] data, long seed0, long seed1) { return CityHash.hash64(data, seed0, seed1); } /** * CityHash算法64-bit实现 * * @param data 数据 * @return hash值 * @since 5.2.5 */ public static long cityHash64(byte[] data) { return CityHash.hash64(data); } /** * CityHash算法128-bit实现 * * @param data 数据 * @return hash值 * @since 5.2.5 */ public static long[] cityHash128(byte[] data) { return CityHash.hash128(data).getLongArray(); } /** * CityHash算法128-bit实现 * * @param data 数据 * @param seed 种子 * @return hash值,long[0]:低位,long[1]:高位 * @since 5.2.5 */ public static long[] cityHash128(byte[] data, Number128 seed) { return CityHash.hash128(data).getLongArray(); } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy