当前位置:   article > 正文

ROS 语音交互(三) tts

ROS 语音交互(三) tts

目录

一、模型选择

二、流程

三、核心代码展示


一、模型选择

科大讯飞超拟人语音合成

二、流程

超拟人合成协议 | 讯飞开放平台文档中心 (xfyun.cn)

三、核心代码展示

  1. # coding: utf-8
  2. import _thread as thread
  3. import os
  4. import time
  5. import base64
  6. import base64
  7. import datetime
  8. import hashlib
  9. import hmac
  10. import json
  11. from urllib.parse import urlparse
  12. import ssl
  13. from datetime import datetime
  14. from time import mktime
  15. from urllib.parse import urlencode
  16. from wsgiref.handlers import format_date_time
  17. import websocket
  18. import openpyxl
  19. from concurrent.futures import ThreadPoolExecutor, as_completed
  20. import os
  21. class Ws_Param(object):
  22. # 初始化
  23. def __init__(self, APPID, APIKey, APISecret, gpt_url):
  24. self.APPID = APPID
  25. self.APIKey = APIKey
  26. self.APISecret = APISecret
  27. self.host = urlparse(gpt_url).netloc
  28. self.path = urlparse(gpt_url).path
  29. self.gpt_url = gpt_url
  30. # 生成url
  31. def create_url(self):
  32. # 生成RFC1123格式的时间戳
  33. now = datetime.now()
  34. date = format_date_time(mktime(now.timetuple()))
  35. # 拼接字符串
  36. signature_origin = "host: " + self.host + "\n"
  37. signature_origin += "date: " + date + "\n"
  38. signature_origin += "GET " + self.path + " HTTP/1.1"
  39. # 进行hmac-sha256进行加密
  40. signature_sha = hmac.new(self.APISecret.encode('utf-8'), signature_origin.encode('utf-8'),
  41. digestmod=hashlib.sha256).digest()
  42. signature_sha_base64 = base64.b64encode(signature_sha).decode(encoding='utf-8')
  43. authorization_origin = f'api_key="{self.APIKey}", algorithm="hmac-sha256", headers="host date request-line", signature="{signature_sha_base64}"'
  44. authorization = base64.b64encode(authorization_origin.encode('utf-8')).decode(encoding='utf-8')
  45. # 将请求的鉴权参数组合为字典
  46. v = {
  47. "authorization": authorization,
  48. "date": date,
  49. "host": self.host
  50. }
  51. # 拼接鉴权参数,生成url
  52. url = self.gpt_url + '?' + urlencode(v)
  53. # 此处打印出建立连接时候的url,参考本demo的时候可取消上方打印的注释,比对相同参数时生成的url与自己代码生成的url是否一致
  54. return url
  55. # 收到websocket错误的处理
  56. def on_error(ws, error):
  57. print("### error:", error)
  58. # 收到websocket关闭的处理
  59. def on_close(ws):
  60. print("### closed ###")
  61. # 收到websocket连接建立的处理
  62. def on_open(ws):
  63. thread.start_new_thread(run, (ws,))
  64. # 收到websocket消息的处理
  65. def on_message(ws, message):
  66. message = json.loads(message)
  67. code = message['header']['code']
  68. if code != 0:
  69. print("### 请求出错: ", message)
  70. else:
  71. payload = message.get("payload")
  72. status = message['header']['status']
  73. if status == 2:
  74. print("### 合成完毕")
  75. ws.close()
  76. if payload and payload != "null":
  77. audio = payload.get("audio")
  78. if audio:
  79. audio = audio["audio"]
  80. with open(fr'./{ws.vcn}.mp3', 'ab') as f:
  81. f.write(base64.b64decode(audio))
  82. def run(ws, *args):
  83. body = {
  84. "header": {
  85. "app_id": ws.appid,
  86. "status": 0
  87. },
  88. "parameter": {
  89. "oral": {
  90. "spark_assist": 1,
  91. "oral_level": "mid"
  92. },
  93. "tts": {
  94. "vcn": ws.vcn,
  95. "speed": 50,
  96. "volume": 50,
  97. "pitch": 50,
  98. "bgs": 0,
  99. "reg": 0,
  100. "rdn": 0,
  101. "rhy": 0,
  102. "scn": 0,
  103. "version": 0,
  104. "L5SilLen": 0,
  105. "ParagraphSilLen": 0,
  106. "audio": {
  107. "encoding": "lame",
  108. "sample_rate": 16000,
  109. "channels": 1,
  110. "bit_depth": 16,
  111. "frame_size": 0
  112. },
  113. "pybuf": {
  114. "encoding": "utf8",
  115. "compress": "raw",
  116. "format": "plain"
  117. }
  118. }
  119. },
  120. "payload": {
  121. "text": {
  122. "encoding": "utf8",
  123. "compress": "raw",
  124. "format": "json",
  125. "status": 0,
  126. "seq": 0,
  127. "text": str(base64.b64encode(ws.text.encode('utf-8')), "UTF8")
  128. }
  129. }
  130. }
  131. ws.send(json.dumps(body))
  132. def main(appid, api_secret, api_key, url, text, vcn):
  133. wsParam = Ws_Param(appid, api_key, api_secret, url)
  134. wsUrl = wsParam.create_url()
  135. ws = websocket.WebSocketApp(wsUrl, on_message=on_message, on_error=on_error, on_close=on_close, on_open=on_open)
  136. websocket.enableTrace(False)
  137. ws.appid = appid
  138. ws.text = text
  139. ws.vcn = vcn
  140. ws.run_forever(sslopt={"cert_reqs": ssl.CERT_NONE})
  141. if __name__ == "__main__":
  142. main(
  143. appid="",
  144. api_secret="",
  145. api_key="",
  146. url="wss://cbm01.cn-huabei-1.xf-yun.com/v1/private/medd90fec",
  147. # 待合成文本
  148. text="今天天气很不错。",
  149. # 发音人参数
  150. vcn = "x4_lingyuzhao_oral"
  151. )

声明:本文内容由网友自发贡献,不代表【wpsshop博客】立场,版权归原作者所有,本站不承担相应法律责任。如您发现有侵权的内容,请联系我们。转载请注明出处:https://www.wpsshop.cn/w/小蓝xlanll/article/detail/261638
推荐阅读
相关标签
  

闽ICP备14008679号