diff --git a/asrserver.py b/asrserver.py deleted file mode 100644 index f3f8489..0000000 --- a/asrserver.py +++ /dev/null @@ -1,157 +0,0 @@ -#!/usr/bin/env python3 -# -*- coding: utf-8 -*- -# -# Copyright 2016-2099 Ailemon.net -# -# This file is part of ASRT Speech Recognition Tool. -# -# ASRT is free software: you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation, either version 3 of the License, or -# (at your option) any later version. -# ASRT is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with ASRT. If not, see . -# ============================================================================ - -""" -@author: nl8590687 -ASRT语音识别API的HTTP服务器程序 -""" - -import http.server -import socket -from speech_model import ModelSpeech -from speech_model_zoo import SpeechModel251BN -from speech_features import Spectrogram -from LanguageModel2 import ModelLanguage - -AUDIO_LENGTH = 1600 -AUDIO_FEATURE_LENGTH = 200 -CHANNELS = 1 -# 默认输出的拼音的表示大小是1428,即1427个拼音+1个空白块 -OUTPUT_SIZE = 1428 -sm251bn = SpeechModel251BN( - input_shape=(AUDIO_LENGTH, AUDIO_FEATURE_LENGTH, CHANNELS), - output_size=OUTPUT_SIZE - ) -feat = Spectrogram() -ms = ModelSpeech(sm251bn, feat, max_label_length=64) -ms.load_model('save_models/' + sm251bn.get_model_name() + '.model.h5') - -ml = ModelLanguage('model_language') -ml.LoadModel() - - -class ASRTHTTPHandle(http.server.BaseHTTPRequestHandler): - def setup(self): - self.request.settimeout(10) - http.server.BaseHTTPRequestHandler.setup(self) - - def _set_response(self): - self.send_response(200) - self.send_header('Content-type', 'text/html') - self.end_headers() - - def do_GET(self): - buf = 'ASRT_SpeechRecognition API' - self.protocal_version = 'HTTP/1.1' - - self._set_response() - - buf = bytes(buf,encoding="utf-8") - self.wfile.write(buf) - - def do_POST(self): - ''' - 处理通过POST方式传递过来并接收的语音数据 - 通过语音模型和语言模型计算得到语音识别结果并返回 - ''' - path = self.path - print(path) - #获取post提交的数据 - datas = self.rfile.read(int(self.headers['content-length'])) - #datas = urllib.unquote(datas).decode("utf-8", 'ignore') - datas = datas.decode('utf-8') - datas_split = datas.split('&') - token = '' - fs = 0 - wavs = [] - - for line in datas_split: - [key, value]=line.split('=') - if key == 'wavs' and value != '': - wavs.append(int(value)) - elif key == 'fs': - fs = int(value) - elif key == 'token': - token = value - else: - print(key, value) - - if token != 'qwertasd': - buf = '403' - print(buf) - buf = bytes(buf,encoding="utf-8") - self.wfile.write(buf) - return - - if len(wavs)>0: - r = self.recognize([wavs], fs) - else: - r = '' - - if token == 'qwertasd': - buf = r - else: - buf = '403' - - self._set_response() - - print(buf) - buf = bytes(buf,encoding="utf-8") - self.wfile.write(buf) - - def recognize(self, wavs, fs): - r='' - try: - r_speech = ms.recognize_speech(wavs, fs) - print(r_speech) - str_pinyin = r_speech - r = ml.SpeechToText(str_pinyin) - except Exception as ex: - r='' - print('[*Message] Server raise a bug. ', ex) - return r - - def recognize_from_file(self, filename): - pass - - -class HTTPServerV6(http.server.HTTPServer): - address_family = socket.AF_INET6 - - -def start_server(ip, port): - if ':' in ip: - http_server = HTTPServerV6((ip, port), ASRTHTTPHandle) - else: - http_server = http.server.HTTPServer((ip, int(port)), ASRTHTTPHandle) - - print('服务器已开启') - - try: - http_server.serve_forever() #设置一直监听并接收请求 - except KeyboardInterrupt: - pass - http_server.server_close() - print('HTTP server closed') - - -if __name__ == '__main__': - start_server('', 20000) # For IPv4 Network Only - #start_server('::', 20000) # For IPv6 Network diff --git a/client.py b/client.py deleted file mode 100644 index d7be0f8..0000000 --- a/client.py +++ /dev/null @@ -1,40 +0,0 @@ -#!/usr/bin/env python3 -# -*- coding: utf-8 -*- -# -# Copyright 2016-2099 Ailemon.net -# -# This file is part of ASRT Speech Recognition Tool. -# -# ASRT is free software: you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation, either version 3 of the License, or -# (at your option) any later version. -# ASRT is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with ASRT. If not, see . -# ============================================================================ - -''' -@author: nl8590687 -ASRT语音识别asrserver测试专用客户端 -''' -import time -import requests -from utils.ops import read_wav_data - -URL = 'http://127.0.0.1:20000/' -TOKEN = 'qwertasd' -wavsignal, fs, _, _ = read_wav_data('X:\\语音数据集\\data_thchs30\\train\\A11_0.wav') -datas={'token':TOKEN, 'fs':fs, 'wavs':wavsignal} - -t0=time.time() -r = requests.post(URL, datas) -t1=time.time() -r.encoding='utf-8' - -print(r.text) -print('time:', t1-t0, 's')