All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.mayabot.nlp.pinyin.PinyinService.kt Maven / Gradle / Ivy

There is a newer version: 3.1.7
Show newest version
/*
 * Copyright 2018 mayabot.com authors. All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *       http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.mayabot.nlp.pinyin

import com.google.common.collect.Lists
import com.mayabot.nlp.MynlpEnv
import com.mayabot.nlp.SettingItem.string
import com.mayabot.nlp.injector.Singleton
import com.mayabot.nlp.pinyin.model.Pinyin
import com.mayabot.nlp.resources.NlpResource
import java.util.*

/**
 * 拼音的词典
 *
 * @author jimichan
 */
@Singleton
class PinyinService constructor(private val mynlp: MynlpEnv) : BasePinyinDictionary() {

    init {
        rebuild()
    }

    internal override fun load(): TreeMap> {
        val list = Lists.newArrayList()

        list.add(mynlp.loadResource(mynlp.get(pinyinSetting)))

        val ext = mynlp.tryLoadResource(pinyinExtDicSetting)
        if (ext != null) {
            list.add(ext)
        }

        val map = TreeMap>()
        for (dictResource in list) {

            dictResource.inputStream()
                    .bufferedReader()
                    .forEachLine { line ->
                        //降龙伏虎=xiang2,long2,fu2,hu3
                        //单=dan1,shan4,chan2
                        val param = line.split("=".toRegex()).dropLastWhile { it.isEmpty() }.toTypedArray()

                        val key = param[0]
                        try {
                            val pinyins = parse(param[1])
                            if (pinyins != null) {
                                map[key] = pinyins
                            }
                        } catch (e: java.lang.Exception) {
                            logger.error("parse ${param[1]}", e)
                        }
                    }
        }
        return map
    }

    companion object {

        @JvmStatic
        val version = "1.0.0"

        @JvmStatic
        val pinyinSetting = string("pinyin.dict", "mynlp-pinyin.txt")

        @JvmStatic
        val pinyinExtDicSetting = string("pinyin.ext.dict", null)
    }

    override fun toString(): String {
        return super.toString()
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy