ASRT_SpeechRecognition/utils/config.py

75 lines
2.1 KiB
Python

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
#
# Copyright 2016-2099 Ailemon.net
#
# This file is part of ASRT Speech Recognition Tool.
#
# ASRT is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
# ASRT is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with ASRT. If not, see <https://www.gnu.org/licenses/>.
# ============================================================================
"""
@author: nl8590687
加载ASRT配置文件相关
"""
import json
# Default configuration file name. It is not referenced inside this module;
# presumably callers pass it to load_config_file() -- verify against callers.
DEFAULT_CONFIG_FILENAME = 'asrt_config.json'
# Cache written by load_config_file(): the parsed configuration, or None
# while nothing has been loaded yet.
_config_dict = None
# Caches written by load_pinyin_dict(): the pinyin -> index dictionary and the
# index -> pinyin list. Both are None while nothing has been loaded yet.
_pinyin_dict = None
_pinyin_list = None
def load_config_file(filename: str) -> dict:
    """
    Load the JSON configuration file.

    The parsed content is cached in the module-level ``_config_dict`` after
    the first successful load. Once the cache is populated, every later call
    returns the cached object without reading any file, regardless of the
    ``filename`` that is passed.

    Args:
        filename: Path of the JSON configuration file; it is read as UTF-8.

    Returns:
        The configuration parsed from the file, or the cached configuration
        if one has already been loaded.

    Raises:
        OSError: If the file cannot be opened (only when nothing is cached).
        json.JSONDecodeError: If the file content is not valid JSON.
    """
    global _config_dict

    # Only touch the file system while the cache is still empty.
    if _config_dict is None:
        with open(filename, mode='r', encoding='utf-8') as config_file:
            raw_text = config_file.read()
        _config_dict = json.loads(raw_text)

    return _config_dict
def load_pinyin_dict(filename: str) -> tuple:
    """
    Load the pinyin list and the pinyin dictionary.

    The pinyin list maps an index to its pinyin; the pinyin dictionary maps a
    pinyin back to its index. The file is read as UTF-8, one entry per line.
    Empty lines are skipped and only the text before the first tab character
    of each line is used as the pinyin. Indices are 0-based and follow the
    order of the entries in the file. If a pinyin appears more than once, the
    list keeps every occurrence and the dictionary points at the last one.

    Both results are cached in the module-level ``_pinyin_list`` and
    ``_pinyin_dict`` after the first successful load. Later calls return the
    cached objects without reading any file, regardless of ``filename``.

    Args:
        filename: Path of the pinyin dictionary file.

    Returns:
        A ``(pinyin_list, pinyin_dict)`` tuple.

    Raises:
        OSError: If the file cannot be opened (only when nothing is cached).
        UnicodeDecodeError: If the file content is not valid UTF-8.
    """
    global _pinyin_list, _pinyin_dict
    if _pinyin_dict is not None and _pinyin_list is not None:
        return _pinyin_list, _pinyin_dict

    # Build into locals and publish to the module-level caches only after the
    # file has been read successfully. Otherwise a failed open()/read() would
    # leave empty containers in the cache, and every later call would return
    # them as if they were a valid (empty) dictionary.
    pinyin_list = []
    pinyin_dict = {}
    with open(filename, 'r', encoding='utf-8') as file_pointer:
        lines = file_pointer.read().split('\n')

    for line in lines:
        if not line:
            continue
        pinyin = line.split('\t')[0]
        pinyin_list.append(pinyin)
        pinyin_dict[pinyin] = len(pinyin_list) - 1

    _pinyin_list, _pinyin_dict = pinyin_list, pinyin_dict
    return _pinyin_list, _pinyin_dict