123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330 |
- #include <stdlib.h>
- #include <stdio.h>
- #include <string.h>
- #include <errno.h>
- #include <unistd.h>
- #include "../../include/qisr.h"
- #include "../../include/msp_cmn.h"
- #include "../../include/msp_errors.h"
- #define SAMPLE_RATE_16K (16000)
- #define SAMPLE_RATE_8K (8000)
- #define MAX_GRAMMARID_LEN (32)
- #define MAX_PARAMS_LEN (1024)
- const char * ASR_RES_PATH = "fo|res/asr/common.jet"; //离线语法识别资源路径
- const char * GRM_BUILD_PATH = "res/asr/GrmBuilld"; //构建离线语法识别网络生成数据保存路径
- const char * GRM_FILE = "call.bnf"; //构建离线识别语法网络所用的语法文件
- const char * LEX_NAME = "contact"; //更新离线识别语法的contact槽(语法文件为此示例中使用的call.bnf)
- typedef struct _UserData {
- int build_fini; //标识语法构建是否完成
- int update_fini; //标识更新词典是否完成
- int errcode; //记录语法构建或更新词典回调错误码
- char grammar_id[MAX_GRAMMARID_LEN]; //保存语法构建返回的语法ID
- }UserData;
- const char *get_audio_file(void); //选择进行离线语法识别的语音文件
- int build_grammar(UserData *udata); //构建离线识别语法网络
- int update_lexicon(UserData *udata); //更新离线识别语法词典
- int run_asr(UserData *udata); //进行离线语法识别
- const char* get_audio_file(void)
- {
- char key = 0;
- while(key != 27) //按Esc则退出
- {
- printf("请选择音频文件:\n");
- printf("1.打电话给丁伟\n");
- printf("2.打电话给黄辣椒\n");
- key = getchar();
- getchar();
- switch(key)
- {
- case '1':
- printf("\n1.打电话给丁伟\n");
- return "wav/ddhgdw.pcm";
- case '2':
- printf("\n2.打电话给黄辣椒\n");
- return "wav/ddhghlj.pcm";
- default:
- continue;
- }
- }
- exit(0);
- return NULL;
- }
- int build_grm_cb(int ecode, const char *info, void *udata)
- {
- UserData *grm_data = (UserData *)udata;
- if (NULL != grm_data) {
- grm_data->build_fini = 1;
- grm_data->errcode = ecode;
- }
- if (MSP_SUCCESS == ecode && NULL != info) {
- printf("构建语法成功! 语法ID:%s\n", info);
- if (NULL != grm_data)
- snprintf(grm_data->grammar_id, MAX_GRAMMARID_LEN - 1, info);
- }
- else
- printf("构建语法失败!%d\n", ecode);
- return 0;
- }
- int build_grammar(UserData *udata)
- {
- FILE *grm_file = NULL;
- char *grm_content = NULL;
- unsigned int grm_cnt_len = 0;
- char grm_build_params[MAX_PARAMS_LEN] = {NULL};
- int ret = 0;
- grm_file = fopen(GRM_FILE, "rb");
- if(NULL == grm_file) {
- printf("打开\"%s\"文件失败![%s]\n", GRM_FILE, strerror(errno));
- return -1;
- }
- fseek(grm_file, 0, SEEK_END);
- grm_cnt_len = ftell(grm_file);
- fseek(grm_file, 0, SEEK_SET);
- grm_content = (char *)malloc(grm_cnt_len + 1);
- if (NULL == grm_content)
- {
- printf("内存分配失败!\n");
- fclose(grm_file);
- grm_file = NULL;
- return -1;
- }
- fread((void*)grm_content, 1, grm_cnt_len, grm_file);
- grm_content[grm_cnt_len] = '\0';
- fclose(grm_file);
- grm_file = NULL;
- snprintf(grm_build_params, MAX_PARAMS_LEN - 1,
- "engine_type = local, \
- asr_res_path = %s, sample_rate = %d, \
- grm_build_path = %s, ",
- ASR_RES_PATH,
- SAMPLE_RATE_16K,
- GRM_BUILD_PATH
- );
- ret = QISRBuildGrammar("bnf", grm_content, grm_cnt_len, grm_build_params, build_grm_cb, udata);
- free(grm_content);
- grm_content = NULL;
- return ret;
- }
- int update_lex_cb(int ecode, const char *info, void *udata)
- {
- UserData *lex_data = (UserData *)udata;
- if (NULL != lex_data) {
- lex_data->update_fini = 1;
- lex_data->errcode = ecode;
- }
- if (MSP_SUCCESS == ecode)
- printf("更新词典成功!\n");
- else
- printf("更新词典失败!%d\n", ecode);
- return 0;
- }
- int update_lexicon(UserData *udata)
- {
- const char *lex_content = "丁伟\n黄辣椒";
- unsigned int lex_cnt_len = strlen(lex_content);
- char update_lex_params[MAX_PARAMS_LEN] = {NULL};
- snprintf(update_lex_params, MAX_PARAMS_LEN - 1,
- "engine_type = local, text_encoding = UTF-8, \
- asr_res_path = %s, sample_rate = %d, \
- grm_build_path = %s, grammar_list = %s, ",
- ASR_RES_PATH,
- SAMPLE_RATE_16K,
- GRM_BUILD_PATH,
- udata->grammar_id);
- return QISRUpdateLexicon(LEX_NAME, lex_content, lex_cnt_len, update_lex_params, update_lex_cb, udata);
- }
- int run_asr(UserData *udata)
- {
- char asr_params[MAX_PARAMS_LEN] = {NULL};
- const char *rec_rslt = NULL;
- const char *session_id = NULL;
- const char *asr_audiof = NULL;
- FILE *f_pcm = NULL;
- char *pcm_data = NULL;
- long pcm_count = 0;
- long pcm_size = 0;
- int last_audio = 0;
- int aud_stat = MSP_AUDIO_SAMPLE_CONTINUE;
- int ep_status = MSP_EP_LOOKING_FOR_SPEECH;
- int rec_status = MSP_REC_STATUS_INCOMPLETE;
- int rss_status = MSP_REC_STATUS_INCOMPLETE;
- int errcode = -1;
- asr_audiof = get_audio_file();
- f_pcm = fopen(asr_audiof, "rb");
- if (NULL == f_pcm) {
- printf("打开\"%s\"失败![%s]\n", f_pcm, strerror(errno));
- goto run_error;
- }
- fseek(f_pcm, 0, SEEK_END);
- pcm_size = ftell(f_pcm);
- fseek(f_pcm, 0, SEEK_SET);
- pcm_data = (char *)malloc(pcm_size);
- if (NULL == pcm_data)
- goto run_error;
- fread((void *)pcm_data, pcm_size, 1, f_pcm);
- fclose(f_pcm);
- f_pcm = NULL;
- //离线语法识别参数设置
- snprintf(asr_params, MAX_PARAMS_LEN - 1,
- "engine_type = local, \
- asr_res_path = %s, sample_rate = %d, \
- grm_build_path = %s, local_grammar = %s, \
- result_type = xml, result_encoding = UTF-8, ",
- ASR_RES_PATH,
- SAMPLE_RATE_16K,
- GRM_BUILD_PATH,
- udata->grammar_id
- );
- session_id = QISRSessionBegin(NULL, asr_params, &errcode);
- if (NULL == session_id)
- goto run_error;
- printf("开始识别...\n");
- while (1) {
- unsigned int len = 6400;
- if (pcm_size < 12800) {
- len = pcm_size;
- last_audio = 1;
- }
- aud_stat = MSP_AUDIO_SAMPLE_CONTINUE;
- if (0 == pcm_count)
- aud_stat = MSP_AUDIO_SAMPLE_FIRST;
- if (len <= 0)
- break;
- printf(">");
- fflush(stdout);
- errcode = QISRAudioWrite(session_id, (const void *)&pcm_data[pcm_count], len, aud_stat, &ep_status, &rec_status);
- if (MSP_SUCCESS != errcode)
- goto run_error;
- pcm_count += (long)len;
- pcm_size -= (long)len;
- //检测到音频结束
- if (MSP_EP_AFTER_SPEECH == ep_status)
- break;
- usleep(150 * 1000); //模拟人说话时间间隙
- }
- //主动点击音频结束
- QISRAudioWrite(session_id, (const void *)NULL, 0, MSP_AUDIO_SAMPLE_LAST, &ep_status, &rec_status);
- free(pcm_data);
- pcm_data = NULL;
- //获取识别结果
- while (MSP_REC_STATUS_COMPLETE != rss_status && MSP_SUCCESS == errcode) {
- rec_rslt = QISRGetResult(session_id, &rss_status, 0, &errcode);
- usleep(150 * 1000);
- }
- printf("\n识别结束:\n");
- printf("=============================================================\n");
- if (NULL != rec_rslt)
- printf("%s\n", rec_rslt);
- else
- printf("没有识别结果!\n");
- printf("=============================================================\n");
- goto run_exit;
- run_error:
- if (NULL != pcm_data) {
- free(pcm_data);
- pcm_data = NULL;
- }
- if (NULL != f_pcm) {
- fclose(f_pcm);
- f_pcm = NULL;
- }
- run_exit:
- QISRSessionEnd(session_id, NULL);
- return errcode;
- }
- int main(int argc, char* argv[])
- {
- const char *login_config = "appid = 5d5b9efd"; //登录参数
- UserData asr_data;
- int ret = 0 ;
- char c;
- ret = MSPLogin(NULL, NULL, login_config); //第一个参数为用户名,第二个参数为密码,传NULL即可,第三个参数是登录参数
- if (MSP_SUCCESS != ret) {
- printf("登录失败:%d\n", ret);
- goto exit;
- }
- memset(&asr_data, 0, sizeof(UserData));
- printf("构建离线识别语法网络...\n");
- ret = build_grammar(&asr_data); //第一次使用某语法进行识别,需要先构建语法网络,获取语法ID,之后使用此语法进行识别,无需再次构建
- if (MSP_SUCCESS != ret) {
- printf("构建语法调用失败!\n");
- goto exit;
- }
- while (1 != asr_data.build_fini)
- usleep(300 * 1000);
- if (MSP_SUCCESS != asr_data.errcode)
- goto exit;
- printf("离线识别语法网络构建完成,开始识别...\n");
- ret = run_asr(&asr_data);
- if (MSP_SUCCESS != ret) {
- printf("离线语法识别出错: %d \n", ret);
- goto exit;
- }
- printf("更新离线语法词典...\n");
- ret = update_lexicon(&asr_data); //当语法词典槽中的词条需要更新时,调用QISRUpdateLexicon接口完成更新
- if (MSP_SUCCESS != ret) {
- printf("更新词典调用失败!\n");
- goto exit;
- }
- while (1 != asr_data.update_fini)
- usleep(300 * 1000);
- if (MSP_SUCCESS != asr_data.errcode)
- goto exit;
- printf("更新离线语法词典完成,开始识别...\n");
- ret = run_asr(&asr_data);
- if (MSP_SUCCESS != ret) {
- printf("离线语法识别出错: %d \n", ret);
- goto exit;
- }
- exit:
- MSPLogout();
- printf("请按任意键退出...\n");
- getchar();
- return 0;
- }
|