/// <summary> /// 把文本转换成声音,写入指定的内存流 /// </summary> /// <param name="SpeekText">要转化成语音的文字</param> /// <param name="mStream">合成结果输出的音频流</param> private void Speek(string SpeekText, ref MemoryStream mStream) { if (SpeekText == "" || _speed == "" || _vol == "" || _speeker == "") { return; } //string szParams = "ssm=1," + _speeker + ",spd=" + _speed + ",aue=speex-wb;7,vol=" + _vol + ",auf=audio/L16;rate=16000"; string szParams = "engine_type = local, voice_name = " + _speeker + ", text_encoding = UTF8, tts_res_path = " + TTSPath(_speeker) + ", sample_rate = 16000, speed = " + _speed + ", volume = " + _vol + ", pitch = 50, rdn = 2"; //string szParams = "engine_type = cloud, voice_name = " + _speeker + ", text_encoding = UTF8, sample_rate = 16000, speed = " + _speed + ", volume = " + _vol + ", pitch = 50, rdn = 2"; //string szParams = "engine_type = cloud ,voice_name = " + _speeker + ", text_encoding = GB2312,sample_rate = 16000"; int ret = 0; try { sessionID = Marshal.PtrToStringAnsi(TTSDll.QTTSSessionBegin(szParams, ref ret)); if (ret != 0) { UnityEngine.Debug.Log(ret); throw new Exception("初始化TTS引会话错误,错误代码:" + ret); } ret = TTSDll.QTTSTextPut(sessionID, SpeekText, (uint)Encoding.Default.GetByteCount(SpeekText), null); if (ret != 0) { UnityEngine.Debug.Log(ret); throw new Exception("向服务器发送数据,错误代码:" + ret); }//IntPtr audio_data; SynthStatus synth_status = SynthStatus.TTS_FLAG_STILL_HAVE_DATA; while (true) { int audio_len = 0; IntPtr source = TTSDll.QTTSAudioGet(sessionID, ref audio_len, ref synth_status, ref ret); byte[] array = new byte[audio_len]; if (audio_len > 0) { Marshal.Copy(source, array, 0, audio_len); } mStream.Write(array, 0, audio_len);//将合成的音频字节数据存放到内存流中 //Thread.Sleep(15);//防止CPU频繁占用 if (synth_status == SynthStatus.TTS_FLAG_DATA_END || ret != 0) { break; } } } catch (Exception ex) { Log.Warning(ex.Message); } finally { ret = TTSDll.QTTSSessionEnd(sessionID, ""); if (ret != 0) { throw new Exception("结束TTS会话错误,错误代码:" + ret); } } }
public void CloseXunFei() { int ret = TTSDll.MSPLogout(); if (ret != 0) { throw new Exception("逆初始化TTS引擎错误,错误代码:" + ret); } }
/// <summary> /// 构造函数,初始化引擎 /// </summary> /// <param name="configs">初始化引擎参数</param> /// <param name="szParams">开始会话用参数</param> public XunFeiTemplate(string name, string password, string configs) { DSpeeker.Add(Speeker.小燕_青年女声_中英文_普通话, "xiaoyan"); DSpeeker.Add(Speeker.小宇_青年男声_中英文_普通话, "xiaoyu"); int ret = TTSDll.MSPLogin(name, password, configs); if (ret != 0) { throw new Exception("初始化TTS引擎错误,错误代码:" + ret); } _speed = "50"; _vol = "100"; _speeker = "xiaoyan"; Log.Info(TTSPath(_speeker)); }
/// <summary> /// 把文字转化为声音,单路配置,一种语音 /// </summary> /// <param name="speekText">要转化成语音的文字</param> /// <param name="outWaveFlie">把声音转为文件,默认为不生产wave文件</param> private void speek(string speekText, string outWaveFlie = null) { if (speekText == "" || _speed == "" || _vol == "" || _speeker == "") { return; } string szParams = "ssm=1," + _speeker + ",spd=" + _speed + ",aue=speex-wb;7,vol=" + _vol + ",auf=audio/L16;rate=16000"; int ret = 0; try { sessionID = Ptr2Str(TTSDll.QTTSSessionBegin(szParams, ref ret)); if (ret != 0) { throw new Exception("初始化TTS引会话错误,错误代码:" + ret); } ret = TTSDll.QTTSTextPut(sessionID, speekText, (uint)Encoding.Default.GetByteCount(speekText), string.Empty); if (ret != 0) { throw new Exception("向服务器发送数据,错误代码:" + ret); } IntPtr audio_data; int audio_len = 0; SynthStatus synth_status = SynthStatus.TTS_FLAG_STILL_HAVE_DATA; MemoryStream fs = new MemoryStream(); fs.Write(new byte[44], 0, 44); //写44字节的空文件头 while (synth_status == SynthStatus.TTS_FLAG_STILL_HAVE_DATA) { audio_data = TTSDll.QTTSAudioGet(sessionID, ref audio_len, ref synth_status, ref ret); if (ret != 0) { break; } byte[] data = new byte[audio_len]; if (audio_len > 0) { Marshal.Copy(audio_data, data, 0, audio_len); } fs.Write(data, 0, data.Length); } WAVE_Header header = getWave_Header((int)fs.Length - 44); //创建wav文件头 byte[] headerByte = StructToBytes(header); //把文件头结构转化为字节数组 //写入文件头 fs.Position = 0; //定位到文件头 fs.Write(headerByte, 0, headerByte.Length); //写入文件头 fs.Position = 0; System.Media.SoundPlayer pl = new System.Media.SoundPlayer(fs); pl.Stop(); pl.Play(); if (outWaveFlie != null) { FileStream ofs = new FileStream(outWaveFlie, FileMode.Create); fs.WriteTo(ofs); fs.Close(); ofs.Close(); fs = null; ofs = null; } } catch (Exception ex) { System.Diagnostics.Debug.WriteLine(ex.Message); } finally { ret = TTSDll.QTTSSessionEnd(sessionID, ""); if (ret != 0) { throw new Exception("结束TTS会话错误,错误代码:" + ret); } } }
private MemoryStream GetAudioData(string str) { int ret = 0; IntPtr session_ID; //APPID请勿随意改动 string login_configs = "appid = 5ac9f8d1"; //登录参数,自己注册后获取的appid string text = str; //text是待合成文本 uint audio_len = 0; SynthStatus synth_status = SynthStatus.MSP_TTS_FLAG_STILL_HAVE_DATA; ret = TTSDll.MSPLogin(string.Empty, string.Empty, login_configs); //第一个参数为用户名,第二个参数为密码,第三个参数是登录参数,用户名和密码需要在http://open.voicecloud.cn //MSPLogin方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return(null); } //string parameter = "engine_type = local, voice_name=xiaoyan, tts_res_path =fo|res\\tts\\xiaoyan.jet;fo|res\\tts\\common.jet, sample_rate = 16000"; string _params = "ssm=1,ent=sms16k,vcn=xiaoyan,spd=medium,aue=speex-wb;7,vol=x-loud,auf=audio/L16;rate=16000"; //string @params = "engine_type = local,voice_name=xiaoyan,speed=50,volume=50,pitch=50,rcn=1, text_encoding = UTF8, background_sound=1,sample_rate = 16000"; session_ID = TTSDll.QTTSSessionBegin(_params, ref ret); //QTTSSessionBegin方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return(null); } ret = TTSDll.QTTSTextPut(Ptr2Str(session_ID), text, (uint)Encoding.Default.GetByteCount(text), string.Empty); //QTTSTextPut方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return(null); } //内存流可直接在内存进行读写,不需要临时缓冲区或者临时文件 MemoryStream memoryStream = new MemoryStream(); memoryStream.Write(new byte[44], 0, 44);//为结构体开辟空间,后面用来存储音频文件结构体 while (true) { IntPtr source = TTSDll.QTTSAudioGet(Ptr2Str(session_ID), ref audio_len, ref synth_status, ref ret); byte[] array = new byte[(int)audio_len]; if (audio_len > 0) { Marshal.Copy(source, array, 0, (int)audio_len); } memoryStream.Write(array, 0, array.Length); //将合成的音频字节数据存放到内存流中 Thread.Sleep(150); //防止CPU频繁占用 if (synth_status == SynthStatus.MSP_TTS_FLAG_DATA_END || ret != 0) { break; } } WAVE_Header wave_Header = getWave_Header((int)memoryStream.Length - 44); byte[] array2 = StructToBytes(wave_Header); memoryStream.Position = 0L; //将指针定位到开头 memoryStream.Write(array2, 0, array2.Length); //存储结构体的字节数组 memoryStream.Position = 0L; //将指针定位到开头 ret = TTSDll.QTTSSessionEnd(Ptr2Str(session_ID), ""); //结束会话 ret = TTSDll.MSPLogout(); //退出登录 return(memoryStream); }
/// <summary> /// 语音识别 /// </summary> /// <param name="text"></param>文本内容 public void SpeechTest(String text, string ent, string vcn) { try { ///APPID请勿随意改动 string login_configs = "appid =59c4ae84 ";//登录参数,自己注册后获取的appid if (string.IsNullOrEmpty(text.Trim())) { text = "请输入合成语音的内容"; } //string filename = "Call.wav"; //合成的语音文件 uint audio_len = 0; SynthStatus synth_status = SynthStatus.MSP_TTS_FLAG_STILL_HAVE_DATA; ret = TTSDll.MSPLogin(string.Empty, string.Empty, login_configs);//第一个参数为用户名,第二个参数为密码,第三个参数是登录参数,用户名和密码需要在http://open.voicecloud.cn //MSPLogin方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return; } string _params = "ssm=1,ent=" + ent + ",vcn=" + vcn + ",spd=medium,aue=speex-wb;7,vol=x-loud,auf=audio/L16;rate=16000"; session_ID = TTSDll.QTTSSessionBegin(_params, ref ret); //QTTSSessionBegin方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return; } ret = TTSDll.QTTSTextPut(Ptr2Str(session_ID), text, (uint)Encoding.Default.GetByteCount(text), string.Empty); //QTTSTextPut方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return; } MemoryStream memoryStream = new MemoryStream(); memoryStream.Write(new byte[44], 0, 44); while (true) { IntPtr source = TTSDll.QTTSAudioGet(Ptr2Str(session_ID), ref audio_len, ref synth_status, ref ret); byte[] array = new byte[(int)audio_len]; if (audio_len > 0) { Marshal.Copy(source, array, 0, (int)audio_len); } memoryStream.Write(array, 0, array.Length); Thread.Sleep(1000); if (synth_status == SynthStatus.MSP_TTS_FLAG_DATA_END || ret != 0) { break; } } WAVE_Header wave_Header = getWave_Header((int)memoryStream.Length - 44); byte[] array2 = this.StructToBytes(wave_Header); memoryStream.Position = 0L; memoryStream.Write(array2, 0, array2.Length); memoryStream.Position = 0L; SoundPlayer soundPlayer = new SoundPlayer(memoryStream); soundPlayer.Stop(); soundPlayer.Play(); //if (filename != null) //{ // FileStream fileStream = new FileStream(filename, FileMode.Create, FileAccess.Write); // memoryStream.WriteTo(fileStream); // memoryStream.Close(); // fileStream.Close(); //} } catch (Exception) { } finally { ret = TTSDll.QTTSSessionEnd(Ptr2Str(session_ID), ""); ret = TTSDll.MSPLogout();//退出登录 } }
/// <summary> /// /// </summary> /// <param name="text">要转换的文字</param> /// <param name="guisy">生成声音文件的标识</param> public string txt2ShengYin(string text, string guisy) { try { ///APPID请勿随意改动 string login_configs = ZmConfig.XunFeiAppId;//登录参数,自己注册后获取的appid if (string.IsNullOrEmpty(text)) { return("请输入合成语音的内容"); } string filename = guisy + ".wav"; //合成的语音文件 uint audio_len = 0; SynthStatus synth_status = SynthStatus.MSP_TTS_FLAG_STILL_HAVE_DATA; //第一个参数为用户名,第二个参数为密码,第三个参数是登录参数,用户名和密码需要在http://open.voicecloud.cn // usr[in] 此参数保留,传入NULL即可。 //pwd[in] 此参数保留,传入NULL即可。 //params[in] 参见下表: //格式说明:每个参数和参数值通过key=value的形式组成参数对;如果有多个参数对,再用逗号进行拼接,如:key_1=value_1,key_2=value_2 //注意:每个参数(key)和参数值(value)均不得含有逗号(,)和等号(=),否则会被截断 //在线/离线业务 参数 名称 ret = TTSDll.MSPLogin(string.Empty, string.Empty, login_configs); //MSPLogin方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return("MSPLogin:"******"engine_type = local, voice_name=xiaoyan, tts_res_path =fo|res\\tts\\xiaoyan.jet;fo|res\\tts\\common.jet, sample_rate = 16000"; string _params = "ssm=1,ent=sms16k,vcn=xiaoyan,spd=medium,aue=speex-wb;7,vol=x-loud,auf=audio/L16;rate=16000"; //string @params = "engine_type = local,voice_name=xiaoyan,speed=50,volume=50,pitch=50,rcn=1, text_encoding = UTF8, background_sound=1,sample_rate = 16000"; session_ID = TTSDll.QTTSSessionBegin(_params, ref ret); //QTTSSessionBegin方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return("QTTSSessionBegin:" + ret.ToString()); } ret = TTSDll.QTTSTextPut(Ptr2Str(session_ID), text, (uint)Encoding.Default.GetByteCount(text), string.Empty); //QTTSTextPut方法返回失败 if (ret != (int)ErrorCode.MSP_SUCCESS) { return("QTTSTextPut:" + ret.ToString()); } MemoryStream memoryStream = new MemoryStream(); memoryStream.Write(new byte[44], 0, 44); while (true) { IntPtr source = TTSDll.QTTSAudioGet(Ptr2Str(session_ID), ref audio_len, ref synth_status, ref ret); byte[] array = new byte[(int)audio_len]; if (audio_len > 0) { Marshal.Copy(source, array, 0, (int)audio_len); } memoryStream.Write(array, 0, array.Length); Thread.Sleep(1000); if (synth_status == SynthStatus.MSP_TTS_FLAG_DATA_END || ret != 0) { break; } } WAVE_Header wave_Header = getWave_Header((int)memoryStream.Length - 44); byte[] array2 = this.StructToBytes(wave_Header); memoryStream.Position = 0L; memoryStream.Write(array2, 0, array2.Length); memoryStream.Position = 0L; if (filename != null) { FileStream fileStream = new FileStream(filename, FileMode.Create, FileAccess.Write); memoryStream.WriteTo(fileStream); memoryStream.Close(); fileStream.Close(); } } catch (Exception) { } finally { ret = TTSDll.QTTSSessionEnd(Ptr2Str(session_ID), ""); ret = TTSDll.MSPLogout();//退出登录 } return("ok:" + guisy); }