All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.nlpcn.commons.lang.tire.library.Library Maven / Gradle / Ivy

package org.nlpcn.commons.lang.tire.library;

import java.io.BufferedReader;
import java.io.FileInputStream;
import java.io.InputStream;
import java.util.List;

import org.nlpcn.commons.lang.tire.domain.Forest;
import org.nlpcn.commons.lang.tire.domain.SmartForest;
import org.nlpcn.commons.lang.tire.domain.Value;
import org.nlpcn.commons.lang.util.IOUtil;

public class Library {

	public static Forest makeForest(String path) throws Exception {
		return makeForest(new FileInputStream(path));
	}

	public static Forest makeForest(String path, String encoding) throws Exception {
		return makeForest(new FileInputStream(path), encoding);
	}

	public static Forest makeForest(InputStream inputStream) throws Exception {
		return makeForest(IOUtil.getReader(inputStream, "UTF-8"));
	}

	public static Forest makeForest(InputStream inputStream, String encoding) throws Exception {
		return makeForest(IOUtil.getReader(inputStream, encoding));
	}

	public static Forest makeForest(BufferedReader br) throws Exception {
		return makeLibrary(br, new Forest());
	}

	/**
	 * 传入value数组.构造树
	 *
	 * @param values
	 * @param forest
	 * @return
	 */
	public static Forest makeForest(List values) {
		Forest forest = new Forest();
		for (Value value : values) {
			insertWord(forest, value.toString());
		}
		return forest;
	}

	/**
	 * 词典树的构造方法
	 *
	 * @param br
	 * @param forest
	 * @return
	 * @throws Exception
	 */
	private static Forest makeLibrary(BufferedReader br, Forest forest) throws Exception {
		if (br == null)
			return forest;
		try {
			String temp = null;
			while ((temp = br.readLine()) != null) {
				insertWord(forest, temp);
			}
		} catch (Exception e) {
			e.printStackTrace();
		} finally {
			br.close();
		}
		return forest;
	}

	public static void insertWord(Forest forest, Value value) {
		insertWord(forest, value.getKeyword(), value.getParamers());
	}

	/**
	 * 插入一个词
	 *
	 * @param forest
	 * @param temp
	 */
	public static void insertWord(Forest forest, String temp) {
		String[] param = temp.split("\t");

		temp = param[0];

		String[] resultParams = new String[param.length - 1];
		for (int j = 1; j < param.length; j++) {
			resultParams[j - 1] = param[j];
		}

		insertWord(forest, temp, resultParams);
	}

	private static void insertWord(Forest forest, String temp, String... param) {
		SmartForest branch = forest;
		char[] chars = temp.toCharArray();
		for (int i = 0; i < chars.length; i++) {
			if (chars.length == i + 1) {
				branch.add(new Forest(chars[i], 3, param));
			} else {
				branch.add(new Forest(chars[i], 1, null));
			}
			branch = branch.getBranch(chars[i]);
		}
	}

	/**
	 * 删除一个词
	 *
	 * @param forest
	 * @param temp
	 */
	public static void removeWord(Forest forest, String word) {
		SmartForest branch = forest;
		char[] chars = word.toCharArray();

		for (int i = 0; i < chars.length; i++) {
			if (branch == null)
				return;
			if (chars.length == i + 1) {
				branch.add(new Forest(chars[i], -1, null));
			}
			branch = branch.getBranch(chars[i]);
		}
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy