tts_sample.c
16.6 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
/*
* 语音合成(Text To Speech,TTS)技术能够自动将任意文字实时转换为连续的
* 自然语音,是一种能够在任何时间、任何地点,向任何人提供语音信息服务的
* 高效便捷手段,非常符合信息时代海量数据、动态更新和个性化查询的需求。
*/
#include <stdlib.h>
#include <stdio.h>
#include <unistd.h>
#include <errno.h>
#include <stdint.h>
#include <string.h>
#include "qtts.h"
#include "msp_cmn.h"
#include "msp_errors.h"
#include "ircut.h"
#include "music.h"
#include "Interface.h"
#include "wiringPi.h"
//#include "widget/test_widget_speaker.h"
/* Integer aliases; not referenced in the visible part of this file. */
typedef int SR_DWORD;
typedef short int SR_WORD ;
/* Session id of the most recent QTTSSessionBegin() call made by
 * text_to_speech(); stop_TTS_paly() passes it to QTTSSessionEnd(). */
const char* TTS_ID = NULL;
/* Extra session ids that stop_TTS_paly() ends when tts_add is 1 / 2.
 * NOTE(review): nothing in the visible code ever assigns them - confirm
 * whether another translation unit does. */
const char* TTS_ID1 = NULL;
const char* TTS_ID2 = NULL;
/* Playback state shared with the rest of the project (defined elsewhere). */
extern int play_mode;   // play_tts() repeats the text while play_mode==1 && TTS_switch==1
extern int reset_play;  // cleared to 0 by the play functions before synthesis starts
extern int now_volume;  // play_tts_mobie() calls Protection(2) when this exceeds 50
extern int tts_add;     // 1: play_tts() appends a "xiaoyan" pass, 2: appends a "xiaofeng" pass
extern int TTS_switch;
extern int TTS_delay;// delay time after TTS playback
extern int now_play_stat;// current playback state: 0 idle, 1 audio playback, 2 text playback, 3 text-file playback, 4 live announcement
/* When set to 1, text_to_speech() also dumps the audio to /root/tts_test_wav.wav. */
int TTS_wav_test = 0;
/* Speed used for the appended voice pass; play_tts() overwrites it with its `speed` argument. */
int tts_speed_add=50;
/*
 * WAV (RIFF / PCM) file header as written at the start of the dump file.
 *
 * The fields are written to disk verbatim with fwrite(), and the code that
 * patches the sizes seeks to byte offsets 4 and 40, so the layout must be
 * exactly 44 bytes. Fixed-width types make that independent of the
 * platform's `int` / `short` widths.
 */
typedef struct _wave_pcm_hdr
{
    char    riff[4];            /* = "RIFF" */
    int32_t size_8;             /* = FileSize - 8 */
    char    wave[4];            /* = "WAVE" */
    char    fmt[4];             /* = "fmt " */
    int32_t fmt_size;           /* = size of the following format chunk : 16 */
    int16_t format_tag;         /* = PCM : 1 */
    int16_t channels;           /* = channel count : 1 */
    int32_t samples_per_sec;    /* = sample rate : 8000 | 6000 | 11025 | 16000 */
    int32_t avg_bytes_per_sec;  /* = bytes per second : samples_per_sec * bits_per_sample / 8 */
    int16_t block_align;        /* = bytes per sample : bits_per_sample / 8 */
    int16_t bits_per_sample;    /* = quantization bits : 8 | 16 */
    char    data[4];            /* = "data" */
    int32_t data_size;          /* = raw audio length : FileSize - 44 */
} wave_pcm_hdr;
/* 默认wav音频头部数据 */
wave_pcm_hdr default_wav_hdr =
{
{ 'R', 'I', 'F', 'F' },
0,
{'W', 'A', 'V', 'E'},
{'f', 'm', 't', ' '},
16,
1,
1,
16000,
32000,
2,
16,
{'d', 'a', 't', 'a'},
0
};
/*
 * Finish the optional WAV dump: patch the two size fields in the header
 * (byte offsets 4 and 40) and close the file. Does nothing when fp is NULL.
 */
static void tts_finish_wav_dump(FILE* fp, wave_pcm_hdr* hdr)
{
    if (NULL == fp)
        return;

    hdr->size_8 += hdr->data_size + (sizeof(*hdr) - 8);
    if (0 == fseek(fp, 4, SEEK_SET))
        fwrite(&hdr->size_8, sizeof(hdr->size_8), 1, fp);
    if (0 == fseek(fp, 40, SEEK_SET))
        fwrite(&hdr->data_size, sizeof(hdr->data_size), 1, fp);
    fclose(fp);
}

/*
 * Text synthesis: open a QTTS session for `src_text`, then fetch audio
 * chunks and hand each one to rawPlay() at 16 kHz until the engine reports
 * the end of data.
 *
 * src_text  NUL-terminated text to synthesize (length taken with strlen()).
 * des_path  Only checked for NULL; this function does not write to it.
 * params    Session parameter string passed to QTTSSessionBegin().
 *
 * Side effects: stores the session id in the global TTS_ID. When the global
 * TTS_wav_test is 1 at entry, the audio is additionally dumped to
 * /root/tts_test_wav.wav.
 *
 * The loop keeps running only while now_play_stat == 2 (text playback). If
 * the state changes, the session is ended and the result of QTTSSessionEnd()
 * is returned.
 *
 * Returns -1 on NULL arguments, the failing MSP error code when a QTTS call
 * fails, otherwise the result of the final QTTSSessionEnd().
 */
int text_to_speech(const char* src_text, const char* des_path, const char* params)
{
    int          ret          = -1;
    FILE*        fp           = NULL;   /* non-NULL only while the WAV dump is active */
    const char*  sessionID    = NULL;
    unsigned int audio_len    = 0;
    wave_pcm_hdr wav_hdr      = default_wav_hdr;
    int          synth_status = MSP_TTS_FLAG_STILL_HAVE_DATA;

    if (NULL == src_text || NULL == des_path)
    {
        printf("params is error!\n");
        return ret;
    }

    /* Start synthesis */
    sessionID = QTTSSessionBegin(params, &ret);
    TTS_ID = sessionID;
    if (MSP_SUCCESS != ret)
    {
        printf("QTTSSessionBegin failed, error code: %d.\n", ret);
        return ret;
    }

    ret = QTTSTextPut(sessionID, src_text, (unsigned int)strlen(src_text), NULL);
    if (MSP_SUCCESS != ret)
    {
        printf("QTTSTextPut failed, error code: %d.\n",ret);
        QTTSSessionEnd(sessionID, "TextPutError");
        return ret;
    }
    printf("正在合成 ...\n");

    if (TTS_wav_test == 1)
    {
        fp = fopen("/root/tts_test_wav.wav", "wb");
        if (NULL == fp)
        {
            /* The dump is diagnostic only: keep playing without it. */
            printf("open /root/tts_test_wav.wav failed, wav dump disabled\n");
        }
        else if (1 != fwrite(&wav_hdr, sizeof(wav_hdr), 1, fp)) /* placeholder header, 16 kHz */
        {
            printf("write wav header failed, wav dump disabled\n");
            fclose(fp);
            fp = NULL;
        }
    }

    while (1)
    {
        if (now_play_stat != 2)
        {
            /* Playback was switched away from text mode: stop right here. */
            printf("now_play_stat = %d return TTS\n",now_play_stat);
            ret = QTTSSessionEnd(sessionID, "Normal");
            tts_finish_wav_dump(fp, &wav_hdr);
            return ret;
        }

        /* Fetch the next chunk of synthesized audio */
        const char* data = QTTSAudioGet(sessionID, &audio_len, &synth_status, &ret);
        if (MSP_SUCCESS != ret)
            break;

        if (NULL != data)
        {
            rawPlay(16000,data,audio_len); /* play the synthesized chunk */
            if (NULL != fp)
            {
                fwrite(data, audio_len, 1, fp);
                wav_hdr.data_size += audio_len; /* accumulate data_size */
            }
        }

        if (MSP_TTS_FLAG_DATA_END == synth_status)
            break;
    }
    printf("\n");

    /* Whatever was captured gets a consistent header, success or not. */
    tts_finish_wav_dump(fp, &wav_hdr);
    fp = NULL;

    if (MSP_SUCCESS != ret)
    {
        printf("QTTSAudioGet failed, error code: %d.\n",ret);
        QTTSSessionEnd(sessionID, "AudioGetError");
        return ret;
    }

    /* Synthesis finished */
    ret = QTTSSessionEnd(sessionID, "Normal");
    if (MSP_SUCCESS != ret)
    {
        printf("QTTSSessionEnd failed, error code: %d.\n",ret);
    }
    return ret;
}
/*
 * Log in to the MSC service with the built-in appid.
 *
 * A failed MSPLogin() is retried immediately, up to 10 retries after the
 * first attempt. "TTS login" is printed only when a login actually
 * succeeded; if every attempt fails, a final failure line is printed
 * instead. The function returns nothing, so callers cannot observe the
 * outcome other than through the log.
 */
void login_tts(void){
    enum { MAX_LOGIN_RETRIES = 10 };
    /* Login parameters; the appid is bound to the msc library, do not change it. */
    const char* login_params = "appid = 03857dfd, work_dir = .";
    int ret = MSP_SUCCESS;
    int error_num = 0;

    for (;;)
    {
        /* Arguments: user name, password, login parameters. */
        ret = MSPLogin(NULL, NULL, login_params);
        if (MSP_SUCCESS == ret)
        {
            printf("TTS login\n");
            return;
        }
        if (error_num >= MAX_LOGIN_RETRIES)
        {
            break;
        }
        error_num += 1;
        printf("TTS Login failed, error code: %d num %d.\n", ret,error_num);
    }

    printf("TTS Login giving up after %d retries, error code: %d.\n", error_num, ret);
}
/*
 * Map a voice selector to the engine voice name. The matching resource file
 * is /root/tts/<voice>.jet. Unknown selectors fall back to "xiaoyan".
 */
static const char* tts_voice_name(int name)
{
    switch (name) {
    case 1:  return "xiaoyan";    /* Chinese, female */
    case 2:  return "xiaofeng";   /* Chinese, male */
    case 11: return "catherine";  /* English, female */
    case 12: return "john";       /* English, male */
    case 31: return "xiaoqian";   /* Northeastern dialect */
    case 32: return "xiaorong";   /* Sichuan dialect */
    case 33: return "xiaokun";    /* Henan dialect */
    case 34: return "xiaoqiang";  /* Hunan dialect */
    case 35: return "xiaoying";   /* Shaanxi dialect */
    case 36: return "xiaomei";    /* Guangdong dialect */
    default: return "xiaoyan";    /* default: Chinese, female */
    }
}

/*
 * Speak a UTF-8 text through the local TTS engine.
 *
 * name    Voice selector (see tts_voice_name()).
 * volume  Engine volume placed in the session parameters.
 * speed   Engine speed placed in the session parameters; also stored in the
 *         global tts_speed_add and used to scale the trailing delay.
 * argv    Despite its declared type this is used as a pointer to the
 *         NUL-terminated text, so it is converted to `const char*` once.
 *
 * Session parameter keys:
 *   rdn            how digits are pronounced
 *   volume         output volume
 *   pitch          output pitch
 *   speed          speaking rate
 *   voice_name     speaker
 *   sample_rate    output sample rate
 *   text_encoding  encoding of the input text
 *
 * Flow: switch the player to text mode (state 2), turn the amplifier on,
 * synthesize the text, optionally synthesize it again with a second voice
 * (tts_add == 1: xiaoyan, tts_add == 2: xiaofeng), and repeat the whole pass
 * every 500 ms while play_mode == 1, TTS_switch == 1 and the state is still 2.
 * Then wait for a time derived from the text length and set the state to 0.
 *
 * Returns 0 after a playback attempt (synthesis errors are only logged),
 * or -1 when the text pointer is NULL.
 */
int play_tts(int name,int volume,int speed, char* argv[])
{
    const char* speech_text = (const char*)argv;
    const char* filename = "/root/record/1.wav"; /* output name handed to text_to_speech() */
    const char* voice = tts_voice_name(name);
    char session_begin_params[512];
    char tts_add1[512];
    char tts_add2[512];
    int ret = MSP_SUCCESS;
    int repeat = 0;
    size_t text_len = 0;

    if (NULL == speech_text)
    {
        printf("play_tts: text is NULL\n");
        return -1;
    }
    tts_speed_add=speed;

    snprintf(session_begin_params,sizeof(session_begin_params),"engine_type = local,voice_name=%s, text_encoding = UTF8, tts_res_path = fo|/root/tts/%s.jet;fo|/root/tts/common.jet, sample_rate = 16000, speed = %d, volume = %d, pitch = 50, rdn = 2",voice,voice,speed,volume);
    printf("session_begin_params=%s\n",session_begin_params);
    printf("argv=%s\n",speech_text);

    /* Parameters for the optional second pass: fixed voice, volume 100. */
    snprintf(tts_add1,sizeof(tts_add1),"engine_type = local,voice_name=xiaoyan, text_encoding = UTF8, tts_res_path = fo|/root/tts/xiaoyan.jet;fo|/root/tts/common.jet, sample_rate = 16000, speed = %d, volume = 100, pitch = 50, rdn = 2",tts_speed_add);
    snprintf(tts_add2,sizeof(tts_add2),"engine_type = local,voice_name=xiaofeng, text_encoding = UTF8, tts_res_path = fo|/root/tts/xiaofeng.jet;fo|/root/tts/common.jet, sample_rate = 16000, speed = %d, volume = 100, pitch = 50, rdn = 2",tts_speed_add);

    /* Text synthesis */
    printf("TTS start\n");
    set_paly_state(2); /* switch to text playback */
    reset_play=0;
    set_amplifier(1);  /* amplifier on */

    do
    {
        ret = text_to_speech(speech_text, filename, session_begin_params);
        if (MSP_SUCCESS != ret)
        {
            printf("text_to_speech failed, error code: %d.\n", ret);
        }
        printf("合成完毕\n");

        if (tts_add==1)
        {
            ret = text_to_speech(speech_text, filename, tts_add1);
            if (MSP_SUCCESS != ret)
            {
                printf("text_to_speech failed, error code: %d.\n", ret);
            }
            printf("追加女声合成完毕\n");
        }
        else if (tts_add==2)
        {
            ret = text_to_speech(speech_text, filename, tts_add2);
            if (MSP_SUCCESS != ret)
            {
                printf("text_to_speech failed, error code: %d.\n", ret);
            }
            printf("追加男声合成完毕\n");
        }

        /* Loop mode: say it again as long as text playback is still active. */
        repeat = (play_mode==1 && TTS_switch==1 && now_play_stat==2);
        if (repeat)
        {
            delay(500);
        }
    } while (repeat);

    /*
     * Trailing wait, scaled by text length and speed. The factors differ on
     * purpose of the original code: 100 for the log line, 120 for the
     * threshold, 150 for the actual wait; long texts wait a flat 8 s.
     */
    text_len = strlen(speech_text);
    printf("延时长度%zu 字节长度%zu \n", text_len*100*speed/50, text_len);
    if (now_play_stat==2)
    {
        if (text_len*120*speed/50 <= 6000)
        {
            delay((unsigned int)(text_len*150*speed/50));
        }
        else
        {
            delay(8000);
        }
    }

    printf("TTS end\n");
    set_paly_state(0); /* playback finished */
    return 0;
}
/*
 * Speak a UTF-8 text once with fixed settings (voice "xiaoyan", speed 50,
 * volume 100), then wait 2 s, switch the amplifier off and set the playback
 * state to 0.
 *
 * name, volume, speed  Accepted for signature compatibility but not used:
 *                      the session parameters are hard-coded, so the voice
 *                      lookup the original performed had no effect and has
 *                      been removed.
 * argv                 Despite its declared type this is used as a pointer
 *                      to the NUL-terminated text.
 *
 * Returns 0 after a playback attempt (synthesis errors are only logged),
 * or -1 when the text pointer is NULL.
 */
int first_tts(int name,int volume,int speed, char* argv[])
{
    static const char session_begin_params[] = "engine_type = local,voice_name=xiaoyan, text_encoding = UTF8, tts_res_path = fo|/root/tts/xiaoyan.jet;fo|/root/tts/common.jet, sample_rate = 16000, speed = 50, volume = 100, pitch = 50, rdn = 2";
    const char* filename = "/root/record/1.wav"; /* output name handed to text_to_speech() */
    const char* speech_text = (const char*)argv;
    int ret = MSP_SUCCESS;

    (void)name;
    (void)volume;
    (void)speed;

    if (NULL == speech_text)
    {
        printf("first_tts: text is NULL\n");
        return -1;
    }

    printf("session_begin_params=%s\n",session_begin_params);
    printf("argv=%s\n",speech_text);

    /* Text synthesis */
    printf("开始合成 ...\n");
    set_paly_state(2); /* switch to text playback */
    set_amplifier(1);  /* amplifier on */
    reset_play=0;

    ret = text_to_speech(speech_text, filename, session_begin_params);
    if (MSP_SUCCESS != ret)
    {
        printf("text_to_speech failed, error code: %d.\n", ret);
    }
    printf("合成完毕\n");

    delay(2000);
    set_amplifier(0);  /* amplifier off */
    set_paly_state(0); /* playback finished */
    return 0;
}
/*
 * Speak a text that was sent from the mobile app.
 *
 * name    Voice selector: 2 selects "xiaofeng"; 1 and any other value select
 *         "xiaoyan" (the original left the voice buffers uninitialised for
 *         unknown selectors).
 * volume  Engine volume placed in the session parameters.
 * speed   Engine speed placed in the session parameters.
 * argv    Despite its declared type this is used as a pointer to the text
 *         bytes; the session declares text_encoding = UNICODE.
 *
 * Session parameter keys:
 *   rdn            how digits are pronounced
 *   volume         output volume
 *   pitch          output pitch
 *   speed          speaking rate
 *   voice_name     speaker
 *   sample_rate    output sample rate
 *   text_encoding  encoding of the input text
 *
 * NOTE(review): text_to_speech() measures the text with strlen(), which
 * stops at the first zero byte - confirm that suits the UNICODE payload.
 * NOTE(review): the session asks for sample_rate = 8000 while
 * text_to_speech() plays at 16000 - confirm this is intended.
 *
 * Flow: stop music, amplifier on, state = 2 (text playback), run
 * Protection(2) when now_volume > 50, synthesize, amplifier off, and finally
 * clear the text-playback state.
 *
 * Returns 0 after a playback attempt (synthesis errors are only logged),
 * or -1 when the text pointer is NULL.
 */
int play_tts_mobie(int name,int volume,int speed, char* argv[])
{
    enum { DUMP_BYTES = 8 };
    const char* speech_text = (const char*)argv;
    const char* filename = "/root/record/1.wav"; /* output name handed to text_to_speech() */
    const char* voice = (name == 2) ? "xiaofeng" : "xiaoyan";
    char session_begin_params[512];
    int ret = MSP_SUCCESS;

    if (NULL == speech_text)
    {
        printf("play_tts_mobie: text is NULL\n");
        return -1;
    }

    snprintf(session_begin_params,sizeof(session_begin_params),"engine_type = local,voice_name=%s, text_encoding = UNICODE, tts_res_path = fo|/root/tts/%s.jet;fo|/root/tts/common.jet, sample_rate = 8000, speed = %d, volume = %d, pitch = 50, rdn = 2",voice,voice,speed,volume);
    printf("session_begin_params=%s\n",session_begin_params);

    /* Debug aid: hex-dump the leading bytes of the text, never past its terminator. */
    for (int i = 0; i < DUMP_BYTES && speech_text[i] != '\0'; i++)
    {
        printf("argv[%d]=%x \n",i,(unsigned int)(unsigned char)speech_text[i]);
    }
    printf("argv=%s\n",speech_text);

    /* Text synthesis */
    printf("手机开始合成 ...\n");
    stop_music();      /* pause music */
    reset_play=0;
    set_amplifier(1);  /* amplifier on */
    now_play_stat=2;   /* text playback */
    if (now_volume>50)
    {
        Protection(2); /* volume above 50: run protection */
    }

    ret = text_to_speech(speech_text, filename, session_begin_params);
    if (MSP_SUCCESS != ret)
    {
        printf("text_to_speech failed, error code: %d.\n", ret);
    }
    printf("合成完毕\n");
    set_amplifier(0);  /* amplifier off */

    /*
     * The original placed this reset after `return`, so it never ran and the
     * state stayed at 2. Only our own state is cleared, so a mode that was
     * selected elsewhere during playback is left alone.
     */
    if (now_play_stat==2)
    {
        now_play_stat=0; /* idle */
    }
    return 0;
}
/*
 * Stop text playback: set the playback state to 0, switch the amplifier off
 * and end the QTTS session stored in TTS_ID. Depending on tts_add, the
 * session in TTS_ID1 (tts_add == 1) or TTS_ID2 (tts_add == 2) is ended too.
 * The results of QTTSSessionEnd() are not checked.
 */
void stop_TTS_paly(){
    printf("stop TTS\n");
    set_paly_state(0); /* no playback */
    set_amplifier(0);  /* amplifier off */

    QTTSSessionEnd(TTS_ID,"stop_tts");

    switch (tts_add)
    {
    case 1:
        QTTSSessionEnd(TTS_ID1,"stop_tts");
        break;
    case 2:
        QTTSSessionEnd(TTS_ID2,"stop_tts");
        break;
    default:
        break;
    }
}