ASRT_SpeechRecognition/asrserver.py

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
#
# Copyright 2016-2099 Ailemon.net
#
# This file is part of ASRT Speech Recognition Tool.
#
# ASRT is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
# ASRT is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with ASRT.  If not, see <https://www.gnu.org/licenses/>.
# ============================================================================

"""
@author: nl8590687
ASRT语音识别API的HTTP服务器程序
"""

import http.server
import socket
from speech_model import ModelSpeech
from speech_model_zoo import SpeechModel251BN
from speech_features import Spectrogram
from LanguageModel2 import ModelLanguage

# Acoustic-model input dimensions, passed below as the model's input_shape.
AUDIO_LENGTH = 1600
AUDIO_FEATURE_LENGTH = 200
CHANNELS = 1
# The default size of the pinyin output representation is 1428,
# i.e. 1427 pinyin symbols + 1 blank block.
OUTPUT_SIZE = 1428
# The models below are built and loaded once, at import time; the request
# handler in this module uses the resulting `ms` and `ml` objects.
sm251bn = SpeechModel251BN(
    input_shape=(AUDIO_LENGTH, AUDIO_FEATURE_LENGTH, CHANNELS),
    output_size=OUTPUT_SIZE
    )
feat = Spectrogram()
ms = ModelSpeech(sm251bn, feat, max_label_length=64)
# The weights file name is derived from the model's own name.
ms.load_model('save_models/' + sm251bn.get_model_name() + '.model.h5')

# Language model; its output is what the server returns to the client.
ml = ModelLanguage('model_language')
ml.LoadModel()


class ASRTHTTPHandle(http.server.BaseHTTPRequestHandler):
    """HTTP request handler for the ASRT speech recognition API.

    GET requests receive a fixed banner string.  POST requests carry a
    form-style body (``key=value`` pairs joined with ``&``) using the keys
    ``token``, ``fs`` and any number of ``wavs`` entries; the reply body is
    the recognized text.
    """

    # Shared secret that clients must send in the ``token`` field.
    # NOTE(review): hard-coded credential; consider loading it from
    # configuration instead of source code.
    _API_TOKEN = 'qwertasd'

    def setup(self):
        """Set a 10 second socket timeout, then run the standard setup."""
        self.request.settimeout(10)
        http.server.BaseHTTPRequestHandler.setup(self)

    def _set_response(self, code=200):
        """Send the status line and headers for a response.

        Args:
            code: HTTP status code to send (defaults to 200).
        """
        self.send_response(code)
        self.send_header('Content-type', 'text/html')
        self.end_headers()

    def _send_text(self, text, code=200):
        """Send a complete response: status, headers, UTF-8 encoded body."""
        self._set_response(code)
        self.wfile.write(bytes(text, encoding="utf-8"))

    def _read_form(self):
        """Read the POST body and split it into ``(key, value)`` pairs.

        Returns:
            A list of ``(key, value)`` string tuples, or ``None`` when the
            body could not be read; in that case an error response (411 for
            a missing Content-Length, 400 otherwise) has already been sent.
        """
        raw_length = self.headers.get('content-length')
        if raw_length is None:
            print('411')
            self._send_text('411', 411)
            return None
        try:
            length = int(raw_length)
            if length < 0:
                # read() with a negative size would wait for end of stream.
                raise ValueError('negative Content-Length')
            datas = self.rfile.read(length).decode('utf-8')
        except ValueError:
            # Covers a non-numeric length and UnicodeDecodeError alike
            # (UnicodeDecodeError is a ValueError subclass).
            print('400')
            self._send_text('400', 400)
            return None
        # partition() never raises: a pair without '=' yields an empty
        # value, and only the first '=' separates key from value.
        return [line.partition('=')[::2] for line in datas.split('&')]

    def do_GET(self):
        """Reply to any GET request with the API banner text."""
        # No Content-Length header is sent, so the response relies on the
        # handler's default protocol version and on the connection being
        # closed to mark the end of the body.
        self._send_text('ASRT_SpeechRecognition API')

    def do_POST(self):
        """Handle speech data submitted via POST and return the result.

        The body is parsed for ``token``, ``fs`` and ``wavs`` fields.  The
        token is checked before any numeric field is converted; a wrong or
        missing token gets a 403 response and non-integer ``fs``/``wavs``
        values get a 400 response.  Otherwise the samples are run through
        ``recognize`` and the text is returned with status 200 (an empty
        body when no samples were supplied).
        """
        path = self.path
        print(path)

        pairs = self._read_form()
        if pairs is None:
            return

        token = ''
        fs_text = None
        wav_texts = []
        for key, value in pairs:
            if key == 'wavs' and value != '':
                wav_texts.append(value)
            elif key == 'fs':
                fs_text = value
            elif key == 'token':
                token = value
            else:
                print(key, value)

        if token != self._API_TOKEN:
            print('403')
            self._send_text('403', 403)
            return

        try:
            fs = 0 if fs_text is None else int(fs_text)
            wavs = [int(item) for item in wav_texts]
        except ValueError:
            print('400')
            self._send_text('400', 400)
            return

        # The samples are wrapped in an outer list before being handed to
        # the recognizer.
        r = self.recognize([wavs], fs) if wavs else ''

        print(r)
        self._send_text(r)

    def recognize(self, wavs, fs):
        """Run the speech model, then the language model, on the samples.

        Args:
            wavs: sample data forwarded to ``ms.recognize_speech``.
            fs: sampling rate forwarded to ``ms.recognize_speech``.

        Returns:
            The result of ``ml.SpeechToText``, or ``''`` if any step raised.
        """
        r = ''
        try:
            r_speech = ms.recognize_speech(wavs, fs)
            print(r_speech)
            r = ml.SpeechToText(r_speech)
        except Exception as ex:
            # Request boundary: report the failure and return an empty
            # result rather than crash the handler.
            r = ''
            print('[*Message] Server raise a bug. ', ex)
        return r

    def recognize_from_file(self, filename):
        """Placeholder; recognition from a file is not implemented."""
        pass


class HTTPServerV6(http.server.HTTPServer):
    """HTTPServer subclass that sets the address family to AF_INET6."""
    address_family = socket.AF_INET6


def start_server(ip, port):
    """Start the ASRT HTTP server and block until it is interrupted.

    Args:
        ip: address to bind.  A value containing ':' selects the IPv6
            server class; anything else uses the plain HTTPServer.
        port: port to listen on; converted with ``int()`` for both
            address families.

    The listening socket is closed on the way out, whether serving ends
    with Ctrl-C or with an unexpected exception.
    """
    server_class = HTTPServerV6 if ':' in ip else http.server.HTTPServer
    http_server = server_class((ip, int(port)), ASRTHTTPHandle)

    print('服务器已开启')

    try:
        # Keep listening for and handling requests until interrupted.
        http_server.serve_forever()
    except KeyboardInterrupt:
        pass
    finally:
        http_server.server_close()
    print('HTTP server closed')


if __name__ == '__main__':
    # Default entry point: serve on port 20000 over IPv4.
    start_server('', 20000) # For IPv4 Network Only
    # Alternative entry point for IPv6; enable it in place of the call above.
    #start_server('::', 20000) # For IPv6 Network
-												add language model and server and fix bugs

											
										
										
											2018-04-21 20:50:53 +08:00
+								#!/usr/bin/env python3
 								# -*- coding: utf-8 -*-
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								#
 								# Copyright 2016-2099 Ailemon.net
 								#
 								# This file is part of ASRT Speech Recognition Tool.
 								#
 								# ASRT is free software: you can redistribute it and/or modify
 								# it under the terms of the GNU General Public License as published by
 								# the Free Software Foundation, either version 3 of the License, or
 								# (at your option) any later version.
 								# ASRT is distributed in the hope that it will be useful,
 								# but WITHOUT ANY WARRANTY; without even the implied warranty of
 								# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 								# GNU General Public License for more details.
 								#
 								# You should have received a copy of the GNU General Public License
 								# along with ASRT.  If not, see <https://www.gnu.org/licenses/>.
 								# ============================================================================
-												add language model and server and fix bugs

											
										
										
											2018-04-21 20:50:53 +08:00
+								"""
 								@author: nl8590687
-												feat: 切换声学模型模块

											
										
										
											2021-11-20 20:32:09 +08:00
+								ASRT语音识别API的HTTP服务器程序
-												add language model and server and fix bugs

											
										
										
											2018-04-21 20:50:53 +08:00
+								"""
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
-												add language model and server and fix bugs

											
										
										
											2018-04-21 20:50:53 +08:00
+								import http.server
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								import socket
-												feat: 切换声学模型模块

											
										
										
											2021-11-20 20:32:09 +08:00
+								from speech_model import ModelSpeech
-												feat: 切换默认声学模型到m251bn

											
										
										
											2022-03-27 21:47:12 +08:00
+								from speech_model_zoo import SpeechModel251BN
-												feat: 切换声学模型模块

											
										
										
											2021-11-20 20:32:09 +08:00
+								from speech_features import Spectrogram
 								from LanguageModel2 import ModelLanguage
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								AUDIO_LENGTH = 1600
 								AUDIO_FEATURE_LENGTH = 200
 								CHANNELS = 1
-												feat: 切换声学模型模块

											
										
										
											2021-11-20 20:32:09 +08:00
+								# 默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								OUTPUT_SIZE = 1428
-												feat: 切换默认声学模型到m251bn

											
										
										
											2022-03-27 21:47:12 +08:00
+								sm251bn = SpeechModel251BN(
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								    input_shape=(AUDIO_LENGTH, AUDIO_FEATURE_LENGTH, CHANNELS),
 								    output_size=OUTPUT_SIZE
-												feat: 切换声学模型模块

											
										
										
											2021-11-20 20:32:09 +08:00
+								    )
 								feat = Spectrogram()
-												feat: 切换默认声学模型到m251bn

											
										
										
											2022-03-27 21:47:12 +08:00
+								ms = ModelSpeech(sm251bn, feat, max_label_length=64)
 								ms.load_model('save_models/' + sm251bn.get_model_name() + '.model.h5')
-												fix bugs and improve asrserver

											
										
										
											2018-05-11 16:56:59 +08:00
 								ml = ModelLanguage('model_language')
 								ml.LoadModel()
-												add language model and server and fix bugs

											
										
										
											2018-04-21 20:50:53 +08:00
-												Add IPv6 support to asrserver

											
										
										
											2019-01-09 16:37:10 +08:00
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								class ASRTHTTPHandle(http.server.BaseHTTPRequestHandler):
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								    def setup(self):
 								        self.request.settimeout(10)
 								        http.server.BaseHTTPRequestHandler.setup(self)
 								    def _set_response(self):
 								        self.send_response(200)
 								        self.send_header('Content-type', 'text/html')
 								        self.end_headers()
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								    def do_GET(self):
 								        buf = 'ASRT_SpeechRecognition API'
 								        self.protocal_version = 'HTTP/1.1'
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								        self._set_response()
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								        buf = bytes(buf,encoding="utf-8")
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								        self.wfile.write(buf)
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								    def do_POST(self):
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								        '''
 								        处理通过POST方式传递过来并接收的语音数据
 								        通过语音模型和语言模型计算得到语音识别结果并返回
 								        '''
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								        path = self.path
 								        print(path)
 								        #获取post提交的数据
 								        datas = self.rfile.read(int(self.headers['content-length']))
 								        #datas = urllib.unquote(datas).decode("utf-8", 'ignore')
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								        datas = datas.decode('utf-8')
 								        datas_split = datas.split('&')
 								        token = ''
 								        fs = 0
 								        wavs = []
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								        for line in datas_split:
 								            [key, value]=line.split('=')
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								            if key == 'wavs' and value != '':
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								                wavs.append(int(value))
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								            elif key == 'fs':
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								                fs = int(value)
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								            elif key == 'token':
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								                token = value
 								            else:
 								                print(key, value)
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
 								        if token != 'qwertasd':
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								            buf = '403'
 								            print(buf)
 								            buf = bytes(buf,encoding="utf-8")
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								            self.wfile.write(buf)
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								            return
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
 								        if len(wavs)>0:
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								            r = self.recognize([wavs], fs)
 								        else:
 								            r = ''
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
 								        if token == 'qwertasd':
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								            buf = r
 								        else:
 								            buf = '403'
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								        self._set_response()
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								        print(buf)
 								        buf = bytes(buf,encoding="utf-8")
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								        self.wfile.write(buf)
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								    def recognize(self, wavs, fs):
 								        r=''
 								        try:
-												feat: 切换声学模型模块

											
										
										
											2021-11-20 20:32:09 +08:00
+								            r_speech = ms.recognize_speech(wavs, fs)
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								            print(r_speech)
 								            str_pinyin = r_speech
 								            r = ml.SpeechToText(str_pinyin)
 								        except Exception as ex:
 								            r=''
 								            print('[*Message] Server raise a bug. ', ex)
 								        return r
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								    def recognize_from_file(self, filename):
 								        pass
-												Add IPv6 support to asrserver

											
										
										
											2019-01-09 16:37:10 +08:00
 								class HTTPServerV6(http.server.HTTPServer):
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								    address_family = socket.AF_INET6
-												Add IPv6 support to asrserver

											
										
										
											2019-01-09 16:37:10 +08:00
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								def start_server(ip, port):
 								    if ':' in ip:
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								        http_server = HTTPServerV6((ip, port), ASRTHTTPHandle)
 								    else:
 								        http_server = http.server.HTTPServer((ip, int(port)), ASRTHTTPHandle)
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								    print('服务器已开启')
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								    try:
-												style: 规范代码风格

											
										
										
											2021-11-26 18:27:35 +08:00
+								        http_server.serve_forever() #设置一直监听并接收请求
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								    except KeyboardInterrupt:
 								        pass
 								    http_server.server_close()
 								    print('HTTP server closed')
-												add language model and server and fix bugs

											
										
										
											2018-04-21 20:50:53 +08:00
+								if __name__ == '__main__':
-												style: 为代码添加头部注释说明

											
										
										
											2021-05-16 19:44:05 +08:00
+								    start_server('', 20000) # For IPv4 Network Only
 								    #start_server('::', 20000) # For IPv6 Network