1、资源下载(可以去讯飞官网控制台下载)
2、实现代码
# Python调普通离线合成并实时播放
import wave
from ctypes import *
import pyaudio"""
1、 在Python中某些时候需要C做效率上的补充,Python中的ctypes模块可以很方便的调用Windows的DLL(也包括Linux下的SO等文件)
2、播放库下载地址:
https://www.lfd.uci.edu/ ~gohlke/pythonlibs/#pyaudio
"""def msp_login(dll):login_params = b'appid = 你的APPID, work_dir = ...'ret = dll.MSPLogin(None, None, login_params)if ret != 0:print(f'调用失败,错误码 {ret}')else:print('调用登录成功...')def tts_session_begin(dll, voice_name): # 开始会话voice_name = voice_namesession_begin_params = f'engine_type = local, voice_name = {voice_name}, text_encoding = UTF-8, ' f'tts_res_path = fo|res/tts/{voice_name}.jet;fo|res/tts/common.jet, sample_rate = 16000, ' f'speed = 50, volume = 50, pitch = 50, rdn = 2'session_begin_params_bytes = bytes(session_begin_params, 'UTF-8')error_code = c_int()dll.QTTSSessionBegin.restype = c_char_p # 设置原生函数返回值为char指针return_session_id = dll.QTTSSessionBegin(session_begin_params_bytes, byref(error_code))print(f'{return_session_id} {type(return_session_id)}')if error_code.value != 0:print(f'调用失败,错误码 {error_code.value}')else:print(f'开启会话成功...')return return_session_iddef tts_text_put(dll, method_text):method_text = method_text.encode('UTF-8')ret = dll.QTTSTextPut(session_id, method_text, len(method_text), None)if ret != 0:print(f'写入合成调用失败,错误码 {ret}')else:print('写入合成文本成功...')def tts_audio_get(dll, temp_session_id, store_file):audio_len, synth_status, return_ret = c_int(), c_int(), c_int()dll.QTTSAudioGet.restype = c_void_p # 设置原生函数返回为void指针return_data_buffer = bytes()while True:return_data = python_dll.QTTSAudioGet(temp_session_id, byref(audio_len), byref(synth_status), byref(return_ret))if return_ret.value != 0:print(f'调用失败,错误码:{return_ret}')breakelse:if return_data:return_data_buffer = return_data_buffer + string_at(return_data, audio_len.value)store_file.writeframes(string_at(return_data, audio_len.value))if synth_status.value == 2: # 说明返回完毕breakreturn return_data_bufferdef tts_session_end(dll, temp_session_id):ret = dll.QTTSSessionEnd(temp_session_id, '正常结束会话...')if ret != 0:print(f'结束会话调用失败,错误码 {ret}')else:print('结束会话成功...')def msp_logout(dll):ret = dll.MSPLogout()if ret != 0:print(f'调用失败,错误码 {ret}')else:print('调用退出成功...')if __name__ == '__main__':# 0、加载dll或sopython_dll = CDLL('dll/msc_x64.dll')# 1、登录msp_login(python_dll)# 2、开启会话session_id = tts_session_begin(python_dll, 'xiaoyuan')# 3、放入文本text = '科大讯飞是中国最大的语音技术提供商'tts_text_put(python_dll, text)# 4、存储文件temp_file = wave.open('tts_sample.wav', 'wb')temp_file.setnchannels(1)temp_file.setsampwidth(2)temp_file.setframerate(16000)return_bytes = tts_audio_get(python_dll, session_id, temp_file)temp_file.close()# 5、同步实时播放py_audio = pyaudio.PyAudio()stream = py_audio.open(format=py_audio.get_format_from_width(width=2), channels=1, rate=16000,output=True)stream.write(return_bytes)# 6、关闭会话tts_session_end(python_dll, session_id)# 7、退出登录msp_logout(python_dll)