// com.whaleal.icefrog.extra.tokenizer.engine.hanlp.HanLPEngine (Maven / Gradle / Ivy)
package com.whaleal.icefrog.extra.tokenizer.engine.hanlp;
import com.hankcs.hanlp.HanLP;
import com.hankcs.hanlp.seg.Segment;
import com.whaleal.icefrog.core.util.StrUtil;
import com.whaleal.icefrog.extra.tokenizer.Result;
import com.whaleal.icefrog.extra.tokenizer.TokenizerEngine;

import java.util.Objects;
/**
 * HanLP word segmentation engine implementation.
 * Project address: https://github.com/hankcs/HanLP
 *
 * @author Looly
 * @author wh
 */
public class HanLPEngine implements TokenizerEngine {

    /** The HanLP segmenter that {@link #parse(CharSequence)} delegates to. */
    private final Segment seg;

    /**
     * Creates an engine backed by the segmenter returned from {@link HanLP#newSegment()}.
     */
    public HanLPEngine() {
        this(HanLP.newSegment());
    }

    /**
     * Creates an engine backed by the given segmenter.
     *
     * @param seg the {@link Segment} used to tokenize text; must not be {@code null}
     * @throws NullPointerException if {@code seg} is {@code null}
     */
    public HanLPEngine(Segment seg) {
        // Fail fast: without this check a null segmenter would only surface later,
        // as a NullPointerException inside parse(), far from the faulty call site.
        this.seg = Objects.requireNonNull(seg, "seg");
    }

    /**
     * Segments the given text with the configured {@link Segment}.
     *
     * <p>The text is first converted with {@link StrUtil#str(CharSequence)}, then handed to
     * the segmenter's {@code seg} method; the segmenter's output is wrapped in a
     * {@code HanLPResult}.
     *
     * @param text the text to tokenize
     * @return a {@link Result} wrapping the segmenter's output
     */
    @Override
    public Result parse(CharSequence text) {
        final String content = StrUtil.str(text);
        return new HanLPResult(this.seg.seg(content));
    }
}