All Downloads are FREE. Search and download functionalities are using the official Maven repository.

cn.hutool.extra.tokenizer.engine.word.WordEngine Maven / Gradle / Ivy

The newest version!
package cn.hutool.extra.tokenizer.engine.word;

import org.apdplat.word.segmentation.Segmentation;
import org.apdplat.word.segmentation.SegmentationAlgorithm;
import org.apdplat.word.segmentation.SegmentationFactory;

import cn.hutool.core.util.StrUtil;
import cn.hutool.extra.tokenizer.Result;
import cn.hutool.extra.tokenizer.TokenizerEngine;

/**
 * Word分词引擎实现
* 项目地址:https://github.com/ysc/word * * @author looly * */ public class WordEngine implements TokenizerEngine { private final Segmentation segmentation; /** * 构造 */ public WordEngine() { this(SegmentationAlgorithm.BidirectionalMaximumMatching); } /** * 构造 * * @param algorithm {@link SegmentationAlgorithm}分词算法枚举 */ public WordEngine(SegmentationAlgorithm algorithm) { this(SegmentationFactory.getSegmentation(algorithm)); } /** * 构造 * * @param segmentation {@link Segmentation}分词实现 */ public WordEngine(Segmentation segmentation) { this.segmentation = segmentation; } @Override public Result parse(CharSequence text) { return new WordResult(this.segmentation.seg(StrUtil.str(text))); } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy