# 科大讯飞语音合成

import time
from ctypes import *
from io import BytesIO
import wave
import platform
import logging
import os

# Configure the root logger so every record from DEBUG upwards is emitted.
logging.basicConfig(level=logging.DEBUG)

# Absolute directory containing this script (symlinks resolved).
BASEPATH = os.path.dirname(os.path.realpath(__file__))


def play(filename):
    """Play an audio file with pygame and block until playback finishes.

    Args:
        filename: Path of the audio file handed to
            ``pygame.mixer.music.load``.
    """
    import pygame
    pygame.mixer.init(frequency=16000)
    pygame.mixer.music.load(filename)
    pygame.mixer.music.play()
    # Poll with a short sleep instead of spinning, so waiting for the
    # playback to end does not keep a CPU core fully busy.
    while pygame.mixer.music.get_busy():
        time.sleep(0.05)


def saveWave(raw_data, _tmpFile='test.wav'):
    """Write raw PCM audio to a WAV file and return the file name.

    The audio is stored as mono, 16-bit, 16 kHz, uncompressed data.

    Args:
        raw_data: Bytes-like object holding the raw PCM frames.
        _tmpFile: Destination path (or writable binary file object).

    Returns:
        ``_tmpFile``, unchanged, so callers can chain the result.
    """
    # The context manager closes the file even if writing fails.
    with wave.open(_tmpFile, 'wb') as wav_file:
        # The frame count is only a placeholder: writeframes() records the
        # real number of frames in the header once the data is written.
        wav_file.setparams((1, 2, 16000, 0, 'NONE', 'not compressed'))
        wav_file.writeframes(raw_data)
    return _tmpFile


# Parameters for QTTSSessionBegin. Kept as bytes because the C API takes
# ``const char*`` and ctypes would pass a ``str`` as a wide string.
_SESSION_BEGIN_PARAMS = (
    b"voice_name = xiaoyan, text_encoding = gbk, sample_rate = 16000, "
    b"speed = 50, volume = 50, pitch = 50, rdn = 2"
)

# Synthesis status reported by QTTSAudioGet once all audio was delivered
# (MSP_TTS_FLAG_DATA_END in the MSC SDK headers).
_SYNTH_STATUS_DATA_END = 2


def _load_msc_library():
    """Load the MSC shared library matching the interpreter's platform."""
    bits, linkage = platform.architecture()
    is_windows = linkage.startswith(('Windows', 'windows'))
    if bits == '32bit':
        sub_dir = 'x86'
        lib_name = 'msc.dll' if is_windows else 'libmsc.so'
    else:
        sub_dir = 'x64'
        lib_name = 'msc_x64.dll' if is_windows else 'libmsc.so'
    return cdll.LoadLibrary(os.path.join(BASEPATH, sub_dir, lib_name))


def _synthesize(msc, text_bytes):
    """Run one TTS session and return the raw PCM bytes, or None on error."""
    # Declare prototypes explicitly: without them ctypes assumes ``int``
    # everywhere, which truncates the session handle on 64-bit platforms.
    session_begin = msc.QTTSSessionBegin
    session_begin.argtypes = [c_char_p, POINTER(c_int)]
    session_begin.restype = c_void_p

    text_put = msc.QTTSTextPut
    text_put.argtypes = [c_void_p, c_char_p, c_uint, c_char_p]
    text_put.restype = c_int

    audio_get = msc.QTTSAudioGet
    audio_get.argtypes = [c_void_p, POINTER(c_uint), POINTER(c_int),
                          POINTER(c_int)]
    audio_get.restype = c_void_p

    session_end = msc.QTTSSessionEnd
    session_end.argtypes = [c_void_p, c_char_p]
    session_end.restype = c_int

    err = c_int(0)
    session_id = session_begin(_SESSION_BEGIN_PARAMS, byref(err))
    if err.value != 0 or session_id is None:
        logging.error("QTTSSessionBegin failed, error code: %s", err.value)
        return None

    # The session is ended exactly once, whatever path leaves this block.
    end_hint = b"Normal"
    try:
        ret = text_put(session_id, text_bytes, len(text_bytes), None)
        if ret != 0:
            logging.error("QTTSTextPut failed, error code: %s", ret)
            end_hint = b"TextPutError"
            return None
        logging.info("正在合成 [%s]..." % text_bytes.decode('gbk', 'replace'))

        audio_len = c_uint(0)
        synth_status = c_int(0)
        pcm = BytesIO()
        while True:
            chunk = audio_get(session_id, byref(audio_len),
                              byref(synth_status), byref(err))
            if err.value != 0:
                logging.error("QTTSAudioGet failed, error code: %s",
                              err.value)
                end_hint = b"AudioGetError"
                return None

            if chunk is not None and audio_len.value:
                # Copy the chunk out of the library-owned buffer.
                pcm.write(string_at(chunk, audio_len.value))

            if synth_status.value == _SYNTH_STATUS_DATA_END:
                return pcm.getvalue()

            logging.debug(".")
            time.sleep(1)
    finally:
        ret = session_end(session_id, end_hint)
        if ret != 0:
            logging.error("QTTSSessionEnd failed, error code: %s", ret)


def text_to_speech(src_text="这不仅仅是一个测试", file_name=None):
    """Synthesize speech for ``src_text`` and save it as a WAV file.

    Args:
        src_text: Text to speak, either ``str`` or GBK-encoded ``bytes``.
            A ``str`` is encoded to GBK, the encoding named in the session
            parameters.
        file_name: Destination WAV path. When ``None`` the default file
            name of ``saveWave`` is used.

    Returns:
        The path of the written WAV file on success, ``None`` when any
        step of the synthesis fails (the failure is logged).
    """
    if isinstance(src_text, str):
        text_bytes = src_text.encode('gbk')
    else:
        text_bytes = bytes(src_text)

    msc = _load_msc_library()

    login = msc.MSPLogin
    login.argtypes = [c_char_p, c_char_p, c_char_p]
    login.restype = c_int
    logout = msc.MSPLogout
    logout.argtypes = []
    logout.restype = c_int

    ret = login(None, None, b'appid = xxx, work_dir = .')
    if ret != 0:
        logging.error("MSPLogin failed, error code: {}".format(ret))
        return None

    try:
        pcm_data = _synthesize(msc, text_bytes)
    finally:
        # Pair every successful login with a logout.
        logout()

    if pcm_data is None:
        return None

    logging.info('合成完成！')
    if file_name is None:
        return saveWave(pcm_data)
    return saveWave(pcm_data, file_name)


if __name__ == '__main__':
    # Demo run: synthesize a sample sentence (GBK-encoded) into a WAV file.
    demo_text = (
        "亲爱的用户，您好，这是一个语音合成示例，感谢您对科大讯飞语音技术的支持！"
        "科大讯飞是亚太地区最大的语音上市公司，股票代码：002230"
    )
    encoded_text = demo_text.encode('gbk')
    text_to_speech(encoded_text, '你好.wav')
# posted @ 2017-11-24 18:40 hyu9999 Views(894) Comments(0) 收藏举报
# 刷新页面返回顶部
# hyu9999
#
# 科大讯飞语音合成
#
# 公告