com.mayabot.nlp.pinyin.PinyinService.kt Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of mynlp-pinyin Show documentation
Show all versions of mynlp-pinyin Show documentation
Maya Nlp subproject :modules:mynlp-pinyin
/*
* Copyright 2018 mayabot.com authors. All rights reserved.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.mayabot.nlp.pinyin
import com.google.common.collect.Lists
import com.mayabot.nlp.MynlpEnv
import com.mayabot.nlp.SettingItem.string
import com.mayabot.nlp.injector.Singleton
import com.mayabot.nlp.pinyin.model.Pinyin
import com.mayabot.nlp.resources.NlpResource
import java.util.*
/**
 * Pinyin dictionary.
 *
 * Calls the inherited `rebuild()` on construction (presumably this is what triggers [load];
 * confirm in `BasePinyinDictionary`). Entries are read from the resource named by
 * [pinyinSetting] and then from the optional extension resource named by
 * [pinyinExtDicSetting]. Because the extension is read last, its entries replace entries
 * with the same key from the main resource.
 *
 * @author jimichan
 */
@Singleton
class PinyinService constructor(private val mynlp: MynlpEnv) : BasePinyinDictionary() {

    init {
        rebuild()
    }

    /**
     * Reads every dictionary resource and collects its `key=pinyin,pinyin,...` lines.
     *
     * Line handling:
     * - blank lines are ignored;
     * - a line with no non-empty value after the first `=` is logged and skipped;
     * - a line whose value makes `parse` throw is logged and skipped;
     * - a line for which `parse` returns `null` is skipped.
     *
     * A single bad line therefore never aborts the whole load.
     *
     * @return the parsed entries, keyed by the text to the left of the first `=`
     */
    internal override fun load(): TreeMap<String, Array<Pinyin>> {
        // NOTE(review): the generic arguments <String, Array<Pinyin>> and <NlpResource> were
        // missing from the reviewed text and are reconstructed from the file's imports;
        // confirm against BasePinyinDictionary.load().
        val resources = Lists.newArrayList<NlpResource>()
        resources.add(mynlp.loadResource(mynlp.get(pinyinSetting)))

        // The extension dictionary is optional: it is only read when it resolves to a resource.
        val ext = mynlp.tryLoadResource(pinyinExtDicSetting)
        if (ext != null) {
            resources.add(ext)
        }

        val map = TreeMap<String, Array<Pinyin>>()
        for (resource in resources) {
            // forEachLine closes the reader once every line has been consumed.
            resource.inputStream()
                .bufferedReader()
                .forEachLine { line -> addEntry(map, line) }
        }
        return map
    }

    /**
     * Parses one dictionary line and stores the result in [target].
     *
     * Expected line shapes:
     * ```
     * 降龙伏虎=xiang2,long2,fu2,hu3
     * 单=dan1,shan4,chan2
     * ```
     */
    private fun addEntry(target: TreeMap<String, Array<Pinyin>>, line: String) {
        if (line.isBlank()) {
            return
        }

        // Trailing empty fields are dropped, so "key=" and "key" both end up with one field.
        val fields = line.split('=').dropLastWhile { it.isEmpty() }
        if (fields.size < 2) {
            logger.error(
                "malformed pinyin dictionary line: $line",
                IllegalArgumentException("expected key=pinyin[,pinyin...]")
            )
            return
        }

        val key = fields[0]
        val value = fields[1]
        try {
            val pinyins = parse(value)
            if (pinyins != null) {
                target[key] = pinyins
            }
        } catch (e: Exception) {
            logger.error("parse $value", e)
        }
    }

    override fun toString(): String = super.toString()

    companion object {
        /** Version string of this dictionary service. */
        @JvmStatic
        val version = "1.0.0"

        /** Setting `pinyin.dict`: name of the main dictionary resource. */
        @JvmStatic
        val pinyinSetting = string("pinyin.dict", "mynlp-pinyin.txt")

        /** Setting `pinyin.ext.dict`: name of the optional extension dictionary; no default. */
        @JvmStatic
        val pinyinExtDicSetting = string("pinyin.ext.dict", null)
    }
}