All Downloads are FREE. Search and download functionalities are using the official Maven repository.

cn.hutool.extra.tokenizer.engine.word.WordEngine Maven / Gradle / Ivy

Go to download

Hutool是一个小而全的Java工具类库,通过静态方法封装,降低相关API的学习成本,提高工作效率,使Java拥有函数式语言般的优雅,让Java语言也可以“甜甜的”。

There is a newer version: 5.8.34
Show newest version
package cn.hutool.extra.tokenizer.engine.word;

import org.apdplat.word.segmentation.Segmentation;
import org.apdplat.word.segmentation.SegmentationAlgorithm;
import org.apdplat.word.segmentation.SegmentationFactory;

import cn.hutool.core.util.StrUtil;
import cn.hutool.extra.tokenizer.Result;
import cn.hutool.extra.tokenizer.TokenizerEngine;

/**
 * Word分词引擎实现
* 项目地址:https://github.com/ysc/word * * @author looly * */ public class WordEngine implements TokenizerEngine { private final Segmentation segmentation; /** * 构造 */ public WordEngine() { this(SegmentationAlgorithm.BidirectionalMaximumMatching); } /** * 构造 * * @param algorithm {@link SegmentationAlgorithm}分词算法枚举 */ public WordEngine(SegmentationAlgorithm algorithm) { this(SegmentationFactory.getSegmentation(algorithm)); } /** * 构造 * * @param segmentation {@link Segmentation}分词实现 */ public WordEngine(Segmentation segmentation) { this.segmentation = segmentation; } @Override public Result parse(CharSequence text) { return new WordResult(this.segmentation.seg(StrUtil.str(text))); } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy