2 år sedan · 882e6c3576
--- a/bridge/bridge.py
+++ b/bridge/bridge.py
@@ -10,7 +10,7 @@ class Bridge(object):
        return bot_factory.create_bot("chatGPT").reply(query, context)

    def fetch_voice_to_text(self, voiceFile):
        return voice_factory.create_voice("google").voiceToText(voiceFile)
        return voice_factory.create_voice("openai").voiceToText(voiceFile)

    def fetch_text_to_voice(self, text):
        return voice_factory.create_voice("google").textToVoice(text)
        return voice_factory.create_voice("baidu").textToVoice(text)
--- a/channel/wechat/wechat_channel.py
+++ b/channel/wechat/wechat_channel.py
@@ -54,14 +54,14 @@ class WechatChannel(Channel):
    def handle_voice(self, msg):
        if conf().get('speech_recognition') != True :
            return
        logger.debug("[WX]receive voice msg: ", msg['FileName'])
        logger.debug("[WX]receive voice msg: " + msg['FileName'])
        thread_pool.submit(self._do_handle_voice, msg)

    def _do_handle_voice(self, msg):
        fileName = self.tmpFilePath+msg['FileName']
        msg.download(fileName)
        content = super().build_voice_to_text(fileName)
        self._handle_single_msg(msg, content, True)
        self._handle_single_msg(msg, content, False)

    def handle_text(self, msg):
        logger.debug("[WX]receive text msg: " + json.dumps(msg, ensure_ascii=False))
--- a/config-template.json
+++ b/config-template.json
@@ -8,6 +8,9 @@
  "image_create_prefix": ["画", "看", "找"],
  "conversation_max_tokens": 1000,
  "speech_recognition": false,
  "baidu_app_id": "YOUR BAIDU APP ID",
  "baidu_api_key": "YOUR BAIDU API KEY",
  "baidu_secret_key": "YOUR BAIDU SERVICE KEY",
  "character_desc": "你是ChatGPT, 一个由OpenAI训练的大型语言模型, 你旨在回答并解决人们的任何问题，并且可以使用多种语言与人交流。",
  "expires_in_seconds": 3600
 }
--- a/voice/baidu/baidu_voice.py
+++ b/voice/baidu/baidu_voice.py
@@ -0,0 +1,22 @@

 """
 baidu voice service
 """
 from aip import AipSpeech
 from voice.voice import Voice
 from config import conf

 class BaiduVoice(Voice):
    APP_ID = conf().get('baidu_app_id')
    API_KEY = conf().get('baidu_api_key')
    SECRET_KEY = conf().get('baidu_secret_key')
    client = AipSpeech(APP_ID, API_KEY, SECRET_KEY)
    
    def __init__(self):
        pass

    def voiceToText(self, voice_file):
        pass

    def textToVoice(self, text):
        pass
--- a/voice/openai/openai_voice.py
+++ b/voice/openai/openai_voice.py
@@ -0,0 +1,25 @@

 """
 google voice service
 """
 import json
 import openai
 from common.log import logger
 from voice.voice import Voice


 class OpenaiVoice(Voice):
    def __init__(self):
        pass

    def voiceToText(self, voice_file):
        file = open(voice_file, "rb")
        reply = openai.Audio.transcribe("whisper-1", file)
        json_dict = json.loads(reply)
        text = json_dict['text']
        logger.info(
            '[Openai] voiceToText text={} voice file name={}'.format(text, voice_file))
        return text

    def textToVoice(self, text):
        pass
--- a/voice/voice_factory.py
+++ b/voice/voice_factory.py
@@ -8,10 +8,13 @@ def create_voice(voice_type):
    :param voice_type: voice type code
    :return: voice instance
    """
    if voice_type == 'xfyun':
        from voice.xfyun.xfyun_voice import XfyunVoice
        return XfyunVoice()
    if voice_type == 'baidu':
        from voice.baidu.baidu_voice import BaiduVoice
        return BaiduVoice()
    elif voice_type == 'google':
        from voice.google.google_voice import GoogleVoice
        return GoogleVoice()
    elif voice_type == 'openai':
        from voice.openai.openai_voice import OpenaiVoice
        return OpenaiVoice()
    raise RuntimeError
--- a/voice/xfyun/xfyun_voice.py
+++ b/voice/xfyun/xfyun_voice.py
@@ -1,35 +0,0 @@

 """
 科大讯飞 voice service
 """

 from voice.voice import Voice

 # 科大讯飞语音识别
 lfasr_host = 'http://raasr.xfyun.cn/api'
 # 请求的接口名
 api_prepare = '/prepare'
 api_upload = '/upload'
 api_merge = '/merge'
 api_get_progress = '/getProgress'
 api_get_result = '/getResult'
 # 文件分片大小10M
 file_piece_sice = 10485760
 # ——————————————————转写可配置参数————————————————
 # 参数可在官网界面（https://doc.xfyun.cn/rest_api/%E8%AF%AD%E9%9F%B3%E8%BD%AC%E5%86%99.html）查看，根据需求可自行在gene_params方法里添加修改
 # 转写类型
 lfasr_type = 0
 # 是否开启分词
 has_participle = 'false'
 has_seperate = 'true'
 # 多候选词个数
 max_alternatives = 0
 # 子用户标识
 suid = ''

 class XfyunVoice(Voice):
    def __init__(self):
        pass

    def voiceToText(self, voice_file):
        pass