// funasrruntime.cpp
  1. #include "precomp.h"
  2. #include <vector>
  // APIs for Init
  4. _FUNASRAPI FUNASR_HANDLE FunASRInit(std::map<std::string, std::string>& model_path, int thread_num, ASR_TYPE type)
  5. {
  6. funasr::Model* mm = funasr::CreateModel(model_path, thread_num, type);
  7. return mm;
  8. }
  9. _FUNASRAPI FUNASR_HANDLE FunASROnlineInit(FUNASR_HANDLE asr_hanlde, std::vector<int> chunk_size)
  10. {
  11. funasr::Model* mm = funasr::CreateModel(asr_hanlde, chunk_size);
  12. return mm;
  13. }
  14. _FUNASRAPI FUNASR_HANDLE FsmnVadInit(std::map<std::string, std::string>& model_path, int thread_num)
  15. {
  16. funasr::VadModel* mm = funasr::CreateVadModel(model_path, thread_num);
  17. return mm;
  18. }
  19. _FUNASRAPI FUNASR_HANDLE FsmnVadOnlineInit(FUNASR_HANDLE fsmnvad_handle)
  20. {
  21. funasr::VadModel* mm = funasr::CreateVadModel(fsmnvad_handle);
  22. return mm;
  23. }
  24. _FUNASRAPI FUNASR_HANDLE CTTransformerInit(std::map<std::string, std::string>& model_path, int thread_num, PUNC_TYPE type)
  25. {
  26. funasr::PuncModel* mm = funasr::CreatePuncModel(model_path, thread_num, type);
  27. return mm;
  28. }
  29. _FUNASRAPI FUNASR_HANDLE FunOfflineInit(std::map<std::string, std::string>& model_path, int thread_num)
  30. {
  31. funasr::OfflineStream* mm = funasr::CreateOfflineStream(model_path, thread_num);
  32. return mm;
  33. }
  34. _FUNASRAPI FUNASR_HANDLE FunTpassInit(std::map<std::string, std::string>& model_path, int thread_num)
  35. {
  36. funasr::TpassStream* mm = funasr::CreateTpassStream(model_path, thread_num);
  37. return mm;
  38. }
  39. _FUNASRAPI FUNASR_HANDLE FunTpassOnlineInit(FUNASR_HANDLE tpass_handle, std::vector<int> chunk_size)
  40. {
  41. return funasr::CreateTpassOnlineStream(tpass_handle, chunk_size);
  42. }
  // APIs for ASR Infer
  44. _FUNASRAPI FUNASR_RESULT FunASRInferBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len, FUNASR_MODE mode, QM_CALLBACK fn_callback, bool input_finished, int sampling_rate, std::string wav_format)
  45. {
  46. funasr::Model* recog_obj = (funasr::Model*)handle;
  47. if (!recog_obj)
  48. return nullptr;
  49. funasr::Audio audio(recog_obj->GetAsrSampleRate(),1);
  50. if(wav_format == "pcm" || wav_format == "PCM"){
  51. if (!audio.LoadPcmwav(sz_buf, n_len, &sampling_rate))
  52. return nullptr;
  53. }else{
  54. if (!audio.FfmpegLoad(sz_buf, n_len))
  55. return nullptr;
  56. }
  57. float* buff;
  58. int len;
  59. int flag = 0;
  60. funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
  61. p_result->snippet_time = audio.GetTimeLen();
  62. if(p_result->snippet_time == 0){
  63. return p_result;
  64. }
  65. int n_step = 0;
  66. int n_total = audio.GetQueueSize();
  67. while (audio.Fetch(buff, len, flag) > 0) {
  68. string msg = recog_obj->Forward(buff, len, input_finished);
  69. p_result->msg += msg;
  70. n_step++;
  71. if (fn_callback)
  72. fn_callback(n_step, n_total);
  73. }
  74. return p_result;
  75. }
  76. _FUNASRAPI FUNASR_RESULT FunASRInfer(FUNASR_HANDLE handle, const char* sz_filename, FUNASR_MODE mode, QM_CALLBACK fn_callback, int sampling_rate)
  77. {
  78. funasr::Model* recog_obj = (funasr::Model*)handle;
  79. if (!recog_obj)
  80. return nullptr;
  81. funasr::Audio audio(recog_obj->GetAsrSampleRate(),1);
  82. if(funasr::is_target_file(sz_filename, "wav")){
  83. int32_t sampling_rate_ = -1;
  84. if(!audio.LoadWav(sz_filename, &sampling_rate_))
  85. return nullptr;
  86. }else if(funasr::is_target_file(sz_filename, "pcm")){
  87. if (!audio.LoadPcmwav(sz_filename, &sampling_rate))
  88. return nullptr;
  89. }else{
  90. if (!audio.FfmpegLoad(sz_filename))
  91. return nullptr;
  92. }
  93. float* buff;
  94. int len;
  95. int flag = 0;
  96. int n_step = 0;
  97. int n_total = audio.GetQueueSize();
  98. funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
  99. p_result->snippet_time = audio.GetTimeLen();
  100. if(p_result->snippet_time == 0){
  101. return p_result;
  102. }
  103. while (audio.Fetch(buff, len, flag) > 0) {
  104. string msg = recog_obj->Forward(buff, len, true);
  105. p_result->msg += msg;
  106. n_step++;
  107. if (fn_callback)
  108. fn_callback(n_step, n_total);
  109. }
  110. return p_result;
  111. }
  // APIs for VAD Infer
  113. _FUNASRAPI FUNASR_RESULT FsmnVadInferBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len, QM_CALLBACK fn_callback, bool input_finished, int sampling_rate, std::string wav_format)
  114. {
  115. funasr::VadModel* vad_obj = (funasr::VadModel*)handle;
  116. if (!vad_obj)
  117. return nullptr;
  118. funasr::Audio audio(vad_obj->GetVadSampleRate(),1);
  119. if(wav_format == "pcm" || wav_format == "PCM"){
  120. if (!audio.LoadPcmwav(sz_buf, n_len, &sampling_rate))
  121. return nullptr;
  122. }else{
  123. if (!audio.FfmpegLoad(sz_buf, n_len))
  124. return nullptr;
  125. }
  126. funasr::FUNASR_VAD_RESULT* p_result = new funasr::FUNASR_VAD_RESULT;
  127. p_result->snippet_time = audio.GetTimeLen();
  128. if(p_result->snippet_time == 0){
  129. return p_result;
  130. }
  131. vector<std::vector<int>> vad_segments;
  132. audio.Split(vad_obj, vad_segments, input_finished);
  133. p_result->segments = new vector<std::vector<int>>(vad_segments);
  134. return p_result;
  135. }
  136. _FUNASRAPI FUNASR_RESULT FsmnVadInfer(FUNASR_HANDLE handle, const char* sz_filename, QM_CALLBACK fn_callback, int sampling_rate)
  137. {
  138. funasr::VadModel* vad_obj = (funasr::VadModel*)handle;
  139. if (!vad_obj)
  140. return nullptr;
  141. funasr::Audio audio(vad_obj->GetVadSampleRate(),1);
  142. if(funasr::is_target_file(sz_filename, "wav")){
  143. int32_t sampling_rate_ = -1;
  144. if(!audio.LoadWav(sz_filename, &sampling_rate_))
  145. return nullptr;
  146. }else if(funasr::is_target_file(sz_filename, "pcm")){
  147. if (!audio.LoadPcmwav(sz_filename, &sampling_rate))
  148. return nullptr;
  149. }else{
  150. if (!audio.FfmpegLoad(sz_filename))
  151. return nullptr;
  152. }
  153. funasr::FUNASR_VAD_RESULT* p_result = new funasr::FUNASR_VAD_RESULT;
  154. p_result->snippet_time = audio.GetTimeLen();
  155. if(p_result->snippet_time == 0){
  156. return p_result;
  157. }
  158. vector<std::vector<int>> vad_segments;
  159. audio.Split(vad_obj, vad_segments, true);
  160. p_result->segments = new vector<std::vector<int>>(vad_segments);
  161. return p_result;
  162. }
  // APIs for PUNC Infer
  164. _FUNASRAPI FUNASR_RESULT CTTransformerInfer(FUNASR_HANDLE handle, const char* sz_sentence, FUNASR_MODE mode, QM_CALLBACK fn_callback, PUNC_TYPE type, FUNASR_RESULT pre_result)
  165. {
  166. funasr::PuncModel* punc_obj = (funasr::PuncModel*)handle;
  167. if (!punc_obj)
  168. return nullptr;
  169. FUNASR_RESULT p_result = nullptr;
  170. if (type==PUNC_OFFLINE){
  171. p_result = (FUNASR_RESULT)new funasr::FUNASR_PUNC_RESULT;
  172. ((funasr::FUNASR_PUNC_RESULT*)p_result)->msg = punc_obj->AddPunc(sz_sentence);
  173. }else if(type==PUNC_ONLINE){
  174. if (!pre_result)
  175. p_result = (FUNASR_RESULT)new funasr::FUNASR_PUNC_RESULT;
  176. else
  177. p_result = pre_result;
  178. ((funasr::FUNASR_PUNC_RESULT*)p_result)->msg = punc_obj->AddPunc(sz_sentence, ((funasr::FUNASR_PUNC_RESULT*)p_result)->arr_cache);
  179. }else{
  180. LOG(ERROR) << "Wrong PUNC_TYPE";
  181. exit(-1);
  182. }
  183. return p_result;
  184. }
  // APIs for Offline-stream Infer
  186. _FUNASRAPI FUNASR_RESULT FunOfflineInferBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len,
  187. FUNASR_MODE mode, QM_CALLBACK fn_callback, const std::vector<std::vector<float>> &hw_emb,
  188. int sampling_rate, std::string wav_format, bool itn, FUNASR_DEC_HANDLE dec_handle)
  189. {
  190. funasr::OfflineStream* offline_stream = (funasr::OfflineStream*)handle;
  191. if (!offline_stream)
  192. return nullptr;
  193. funasr::Audio audio(offline_stream->asr_handle->GetAsrSampleRate(),1);
  194. try{
  195. if(wav_format == "pcm" || wav_format == "PCM"){
  196. if (!audio.LoadPcmwav(sz_buf, n_len, &sampling_rate))
  197. return nullptr;
  198. }else{
  199. if (!audio.FfmpegLoad(sz_buf, n_len))
  200. return nullptr;
  201. }
  202. }catch (std::exception const &e)
  203. {
  204. LOG(ERROR)<<e.what();
  205. return nullptr;
  206. }
  207. funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
  208. p_result->snippet_time = audio.GetTimeLen();
  209. if(p_result->snippet_time == 0){
  210. return p_result;
  211. }
  212. if(offline_stream->UseVad()){
  213. audio.Split(offline_stream);
  214. }
  215. float* buff;
  216. int len;
  217. int flag = 0;
  218. int n_step = 0;
  219. int n_total = audio.GetQueueSize();
  220. float start_time = 0.0;
  221. std::string cur_stamp = "[";
  222. std::string lang = (offline_stream->asr_handle)->GetLang();
  223. while (audio.Fetch(buff, len, flag, start_time) > 0) {
  224. // dec reset
  225. funasr::WfstDecoder* wfst_decoder = (funasr::WfstDecoder*)dec_handle;
  226. if (wfst_decoder){
  227. wfst_decoder->StartUtterance();
  228. }
  229. string msg = (offline_stream->asr_handle)->Forward(buff, len, true, hw_emb, dec_handle);
  230. std::vector<std::string> msg_vec = funasr::split(msg, '|');
  231. if(msg_vec.size()==0){
  232. continue;
  233. }
  234. if(lang == "en-bpe" && p_result->msg != ""){
  235. p_result->msg += " ";
  236. }
  237. p_result->msg += msg_vec[0];
  238. //timestamp
  239. if(msg_vec.size() > 1){
  240. std::vector<std::string> msg_stamp = funasr::split(msg_vec[1], ',');
  241. for(int i=0; i<msg_stamp.size()-1; i+=2){
  242. float begin = std::stof(msg_stamp[i])+start_time;
  243. float end = std::stof(msg_stamp[i+1])+start_time;
  244. cur_stamp += "["+std::to_string((int)(1000*begin))+","+std::to_string((int)(1000*end))+"],";
  245. }
  246. }
  247. n_step++;
  248. if (fn_callback)
  249. fn_callback(n_step, n_total);
  250. }
  251. if(cur_stamp != "["){
  252. cur_stamp.erase(cur_stamp.length() - 1);
  253. p_result->stamp += cur_stamp + "]";
  254. }
  255. if(offline_stream->UsePunc()){
  256. string punc_res = (offline_stream->punc_handle)->AddPunc((p_result->msg).c_str(), lang);
  257. p_result->msg = punc_res;
  258. }
  259. #if !defined(__APPLE__)
  260. if(offline_stream->UseITN() && itn){
  261. string msg_itn = offline_stream->itn_handle->Normalize(p_result->msg);
  262. if(!(p_result->stamp).empty()){
  263. std::string new_stamp = funasr::TimestampSmooth(p_result->msg, msg_itn, p_result->stamp);
  264. if(!new_stamp.empty()){
  265. p_result->stamp = new_stamp;
  266. }
  267. }
  268. p_result->msg = msg_itn;
  269. }
  270. #endif
  271. return p_result;
  272. }
  273. _FUNASRAPI FUNASR_RESULT FunOfflineInfer(FUNASR_HANDLE handle, const char* sz_filename, FUNASR_MODE mode, QM_CALLBACK fn_callback,
  274. const std::vector<std::vector<float>> &hw_emb, int sampling_rate, bool itn, FUNASR_DEC_HANDLE dec_handle)
  275. {
  276. funasr::OfflineStream* offline_stream = (funasr::OfflineStream*)handle;
  277. if (!offline_stream)
  278. return nullptr;
  279. funasr::Audio audio((offline_stream->asr_handle)->GetAsrSampleRate(),1);
  280. try{
  281. if(funasr::is_target_file(sz_filename, "wav")){
  282. int32_t sampling_rate_ = -1;
  283. if(!audio.LoadWav(sz_filename, &sampling_rate_))
  284. return nullptr;
  285. }else if(funasr::is_target_file(sz_filename, "pcm")){
  286. if (!audio.LoadPcmwav(sz_filename, &sampling_rate))
  287. return nullptr;
  288. }else{
  289. if (!audio.FfmpegLoad(sz_filename))
  290. return nullptr;
  291. }
  292. }catch (std::exception const &e)
  293. {
  294. LOG(ERROR)<<e.what();
  295. return nullptr;
  296. }
  297. funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
  298. p_result->snippet_time = audio.GetTimeLen();
  299. if(p_result->snippet_time == 0){
  300. return p_result;
  301. }
  302. if(offline_stream->UseVad()){
  303. audio.Split(offline_stream);
  304. }
  305. float* buff;
  306. int len;
  307. int flag = 0;
  308. int n_step = 0;
  309. int n_total = audio.GetQueueSize();
  310. float start_time = 0.0;
  311. std::string cur_stamp = "[";
  312. std::string lang = (offline_stream->asr_handle)->GetLang();
  313. while (audio.Fetch(buff, len, flag, start_time) > 0) {
  314. // dec reset
  315. funasr::WfstDecoder* wfst_decoder = (funasr::WfstDecoder*)dec_handle;
  316. if (wfst_decoder){
  317. wfst_decoder->StartUtterance();
  318. }
  319. string msg = (offline_stream->asr_handle)->Forward(buff, len, true, hw_emb, dec_handle);
  320. std::vector<std::string> msg_vec = funasr::split(msg, '|');
  321. if(msg_vec.size()==0){
  322. continue;
  323. }
  324. if(lang == "en-bpe" && p_result->msg != ""){
  325. p_result->msg += " ";
  326. }
  327. p_result->msg += msg_vec[0];
  328. //timestamp
  329. if(msg_vec.size() > 1){
  330. std::vector<std::string> msg_stamp = funasr::split(msg_vec[1], ',');
  331. for(int i=0; i<msg_stamp.size()-1; i+=2){
  332. float begin = std::stof(msg_stamp[i])+start_time;
  333. float end = std::stof(msg_stamp[i+1])+start_time;
  334. cur_stamp += "["+std::to_string((int)(1000*begin))+","+std::to_string((int)(1000*end))+"],";
  335. }
  336. }
  337. n_step++;
  338. if (fn_callback)
  339. fn_callback(n_step, n_total);
  340. }
  341. if(cur_stamp != "["){
  342. cur_stamp.erase(cur_stamp.length() - 1);
  343. p_result->stamp += cur_stamp + "]";
  344. }
  345. if(offline_stream->UsePunc()){
  346. string punc_res = (offline_stream->punc_handle)->AddPunc((p_result->msg).c_str(), lang);
  347. p_result->msg = punc_res;
  348. }
  349. #if !defined(__APPLE__)
  350. if(offline_stream->UseITN() && itn){
  351. string msg_itn = offline_stream->itn_handle->Normalize(p_result->msg);
  352. if(!(p_result->stamp).empty()){
  353. std::string new_stamp = funasr::TimestampSmooth(p_result->msg, msg_itn, p_result->stamp);
  354. if(!new_stamp.empty()){
  355. p_result->stamp = new_stamp;
  356. }
  357. }
  358. p_result->msg = msg_itn;
  359. }
  360. #endif
  361. return p_result;
  362. }
  363. #if !defined(__APPLE__)
  364. _FUNASRAPI const std::vector<std::vector<float>> CompileHotwordEmbedding(FUNASR_HANDLE handle, std::string &hotwords, ASR_TYPE mode)
  365. {
  366. if (mode == ASR_OFFLINE){
  367. funasr::OfflineStream* offline_stream = (funasr::OfflineStream*)handle;
  368. std::vector<std::vector<float>> emb;
  369. if (!offline_stream)
  370. return emb;
  371. return (offline_stream->asr_handle)->CompileHotwordEmbedding(hotwords);
  372. }
  373. else if (mode == ASR_TWO_PASS){
  374. funasr::TpassStream* tpass_stream = (funasr::TpassStream*)handle;
  375. std::vector<std::vector<float>> emb;
  376. if (!tpass_stream)
  377. return emb;
  378. return (tpass_stream->asr_handle)->CompileHotwordEmbedding(hotwords);
  379. }
  380. else{
  381. LOG(ERROR) << "Not implement: Online model does not support Hotword yet!";
  382. std::vector<std::vector<float>> emb;
  383. return emb;
  384. }
  385. }
  386. #endif
  // APIs for 2pass-stream Infer
  388. _FUNASRAPI FUNASR_RESULT FunTpassInferBuffer(FUNASR_HANDLE handle, FUNASR_HANDLE online_handle, const char* sz_buf,
  389. int n_len, std::vector<std::vector<std::string>> &punc_cache, bool input_finished,
  390. int sampling_rate, std::string wav_format, ASR_TYPE mode,
  391. const std::vector<std::vector<float>> &hw_emb, bool itn)
  392. {
  393. funasr::TpassStream* tpass_stream = (funasr::TpassStream*)handle;
  394. funasr::TpassOnlineStream* tpass_online_stream = (funasr::TpassOnlineStream*)online_handle;
  395. if (!tpass_stream || !tpass_online_stream)
  396. return nullptr;
  397. funasr::VadModel* vad_online_handle = (tpass_online_stream->vad_online_handle).get();
  398. if (!vad_online_handle)
  399. return nullptr;
  400. funasr::Audio* audio = ((funasr::FsmnVadOnline*)vad_online_handle)->audio_handle.get();
  401. funasr::Model* asr_online_handle = (tpass_online_stream->asr_online_handle).get();
  402. if (!asr_online_handle)
  403. return nullptr;
  404. int chunk_len = ((funasr::ParaformerOnline*)asr_online_handle)->chunk_len;
  405. funasr::Model* asr_handle = (tpass_stream->asr_handle).get();
  406. if (!asr_handle)
  407. return nullptr;
  408. funasr::PuncModel* punc_online_handle = (tpass_stream->punc_online_handle).get();
  409. if (!punc_online_handle)
  410. return nullptr;
  411. if(wav_format == "pcm" || wav_format == "PCM"){
  412. if (!audio->LoadPcmwavOnline(sz_buf, n_len, &sampling_rate))
  413. return nullptr;
  414. }else{
  415. // if (!audio->FfmpegLoad(sz_buf, n_len))
  416. // return nullptr;
  417. LOG(ERROR) <<"Wrong wav_format: " << wav_format ;
  418. return nullptr;
  419. }
  420. funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
  421. p_result->snippet_time = audio->GetTimeLen();
  422. audio->Split(vad_online_handle, chunk_len, input_finished, mode);
  423. funasr::AudioFrame* frame = NULL;
  424. while(audio->FetchChunck(frame) > 0){
  425. string msg = ((funasr::ParaformerOnline*)asr_online_handle)->Forward(frame->data, frame->len, frame->is_final);
  426. if(mode == ASR_ONLINE){
  427. ((funasr::ParaformerOnline*)asr_online_handle)->online_res += msg;
  428. if(frame->is_final){
  429. string online_msg = ((funasr::ParaformerOnline*)asr_online_handle)->online_res;
  430. string msg_punc = punc_online_handle->AddPunc(online_msg.c_str(), punc_cache[0]);
  431. p_result->tpass_msg = msg_punc;
  432. #if !defined(__APPLE__)
  433. // ITN
  434. if(tpass_stream->UseITN() && itn){
  435. string msg_itn = tpass_stream->itn_handle->Normalize(msg_punc);
  436. p_result->tpass_msg = msg_itn;
  437. }
  438. #endif
  439. ((funasr::ParaformerOnline*)asr_online_handle)->online_res = "";
  440. p_result->msg += msg;
  441. }else{
  442. p_result->msg += msg;
  443. }
  444. }else if(mode == ASR_TWO_PASS){
  445. p_result->msg += msg;
  446. }
  447. if(frame != NULL){
  448. delete frame;
  449. frame = NULL;
  450. }
  451. }
  452. // timestamp
  453. std::string cur_stamp = "[";
  454. while(audio->FetchTpass(frame) > 0){
  455. string msg = ((funasr::Paraformer*)asr_handle)->Forward(frame->data, frame->len, frame->is_final, hw_emb);
  456. std::vector<std::string> msg_vec = funasr::split(msg, '|'); // split with timestamp
  457. if(msg_vec.size()==0){
  458. continue;
  459. }
  460. msg = msg_vec[0];
  461. //timestamp
  462. if(msg_vec.size() > 1){
  463. std::vector<std::string> msg_stamp = funasr::split(msg_vec[1], ',');
  464. for(int i=0; i<msg_stamp.size()-1; i+=2){
  465. float begin = std::stof(msg_stamp[i]) + float(frame->global_start)/1000.0;
  466. float end = std::stof(msg_stamp[i+1]) + float(frame->global_start)/1000.0;
  467. cur_stamp += "["+std::to_string((int)(1000*begin))+","+std::to_string((int)(1000*end))+"],";
  468. }
  469. }
  470. if(cur_stamp != "["){
  471. cur_stamp.erase(cur_stamp.length() - 1);
  472. p_result->stamp += cur_stamp + "]";
  473. }
  474. string msg_punc = punc_online_handle->AddPunc(msg.c_str(), punc_cache[1]);
  475. if(input_finished){
  476. msg_punc += "。";
  477. }
  478. p_result->tpass_msg = msg_punc;
  479. #if !defined(__APPLE__)
  480. if(tpass_stream->UseITN() && itn){
  481. string msg_itn = tpass_stream->itn_handle->Normalize(msg_punc);
  482. // TimestampSmooth
  483. if(!(p_result->stamp).empty()){
  484. std::string new_stamp = funasr::TimestampSmooth(p_result->tpass_msg, msg_itn, p_result->stamp);
  485. if(!new_stamp.empty()){
  486. p_result->stamp = new_stamp;
  487. }
  488. }
  489. p_result->tpass_msg = msg_itn;
  490. }
  491. #endif
  492. if(frame != NULL){
  493. delete frame;
  494. frame = NULL;
  495. }
  496. }
  497. if(input_finished){
  498. audio->ResetIndex();
  499. }
  500. return p_result;
  501. }
  502. _FUNASRAPI const int FunASRGetRetNumber(FUNASR_RESULT result)
  503. {
  504. if (!result)
  505. return 0;
  506. return 1;
  507. }
  // APIs for GetRetSnippetTime
  509. _FUNASRAPI const float FunASRGetRetSnippetTime(FUNASR_RESULT result)
  510. {
  511. if (!result)
  512. return 0.0f;
  513. return ((funasr::FUNASR_RECOG_RESULT*)result)->snippet_time;
  514. }
  515. _FUNASRAPI const float FsmnVadGetRetSnippetTime(FUNASR_RESULT result)
  516. {
  517. if (!result)
  518. return 0.0f;
  519. return ((funasr::FUNASR_VAD_RESULT*)result)->snippet_time;
  520. }
  // APIs for GetResult
  522. _FUNASRAPI const char* FunASRGetResult(FUNASR_RESULT result,int n_index)
  523. {
  524. funasr::FUNASR_RECOG_RESULT * p_result = (funasr::FUNASR_RECOG_RESULT*)result;
  525. if(!p_result)
  526. return nullptr;
  527. return p_result->msg.c_str();
  528. }
  529. _FUNASRAPI const char* FunASRGetStamp(FUNASR_RESULT result)
  530. {
  531. funasr::FUNASR_RECOG_RESULT * p_result = (funasr::FUNASR_RECOG_RESULT*)result;
  532. if(!p_result)
  533. return nullptr;
  534. return p_result->stamp.c_str();
  535. }
  536. _FUNASRAPI const char* FunASRGetTpassResult(FUNASR_RESULT result,int n_index)
  537. {
  538. funasr::FUNASR_RECOG_RESULT * p_result = (funasr::FUNASR_RECOG_RESULT*)result;
  539. if(!p_result)
  540. return nullptr;
  541. return p_result->tpass_msg.c_str();
  542. }
  543. _FUNASRAPI const char* CTTransformerGetResult(FUNASR_RESULT result,int n_index)
  544. {
  545. funasr::FUNASR_PUNC_RESULT * p_result = (funasr::FUNASR_PUNC_RESULT*)result;
  546. if(!p_result)
  547. return nullptr;
  548. return p_result->msg.c_str();
  549. }
  550. _FUNASRAPI vector<std::vector<int>>* FsmnVadGetResult(FUNASR_RESULT result,int n_index)
  551. {
  552. funasr::FUNASR_VAD_RESULT * p_result = (funasr::FUNASR_VAD_RESULT*)result;
  553. if(!p_result)
  554. return nullptr;
  555. return p_result->segments;
  556. }
  // APIs for FreeResult
  558. _FUNASRAPI void FunASRFreeResult(FUNASR_RESULT result)
  559. {
  560. if (result)
  561. {
  562. delete (funasr::FUNASR_RECOG_RESULT*)result;
  563. }
  564. }
  565. _FUNASRAPI void CTTransformerFreeResult(FUNASR_RESULT result)
  566. {
  567. if (result)
  568. {
  569. delete (funasr::FUNASR_PUNC_RESULT*)result;
  570. }
  571. }
  572. _FUNASRAPI void FsmnVadFreeResult(FUNASR_RESULT result)
  573. {
  574. funasr::FUNASR_VAD_RESULT * p_result = (funasr::FUNASR_VAD_RESULT*)result;
  575. if (p_result)
  576. {
  577. if(p_result->segments){
  578. delete p_result->segments;
  579. }
  580. delete p_result;
  581. }
  582. }
  // APIs for decoder status reset
  584. _FUNASRAPI void FunASRReset(FUNASR_HANDLE handle, FUNASR_DEC_HANDLE dec_handle)
  585. {
  586. funasr::Model* recog_obj = (funasr::Model*)handle;
  587. recog_obj->StartUtterance();
  588. funasr::WfstDecoder* wfst_decoder = (funasr::WfstDecoder*)dec_handle;
  589. if (wfst_decoder)
  590. wfst_decoder->StartUtterance();
  591. }
  592. _FUNASRAPI void FunOfflineReset(FUNASR_HANDLE handle, FUNASR_DEC_HANDLE dec_handle)
  593. {
  594. funasr::OfflineStream* recog_obj = (funasr::OfflineStream*)handle;
  595. recog_obj->asr_handle->StartUtterance();
  596. funasr::WfstDecoder* wfst_decoder = (funasr::WfstDecoder*)dec_handle;
  597. if (wfst_decoder)
  598. wfst_decoder->StartUtterance();
  599. }
  // APIs for Uninit
  601. _FUNASRAPI void FunASRUninit(FUNASR_HANDLE handle)
  602. {
  603. funasr::Model* recog_obj = (funasr::Model*)handle;
  604. if (!recog_obj)
  605. return;
  606. delete recog_obj;
  607. }
  608. _FUNASRAPI void FsmnVadUninit(FUNASR_HANDLE handle)
  609. {
  610. funasr::VadModel* recog_obj = (funasr::VadModel*)handle;
  611. if (!recog_obj)
  612. return;
  613. delete recog_obj;
  614. }
  615. _FUNASRAPI void CTTransformerUninit(FUNASR_HANDLE handle)
  616. {
  617. funasr::PuncModel* punc_obj = (funasr::PuncModel*)handle;
  618. if (!punc_obj)
  619. return;
  620. delete punc_obj;
  621. }
  622. _FUNASRAPI void FunOfflineUninit(FUNASR_HANDLE handle)
  623. {
  624. funasr::OfflineStream* offline_stream = (funasr::OfflineStream*)handle;
  625. if (!offline_stream)
  626. return;
  627. delete offline_stream;
  628. }
  629. _FUNASRAPI void FunTpassUninit(FUNASR_HANDLE handle)
  630. {
  631. funasr::TpassStream* tpass_stream = (funasr::TpassStream*)handle;
  632. if (!tpass_stream)
  633. return;
  634. delete tpass_stream;
  635. }
  636. _FUNASRAPI void FunTpassOnlineUninit(FUNASR_HANDLE handle)
  637. {
  638. funasr::TpassOnlineStream* tpass_online_stream = (funasr::TpassOnlineStream*)handle;
  639. if (!tpass_online_stream)
  640. return;
  641. delete tpass_online_stream;
  642. }
  643. _FUNASRAPI FUNASR_DEC_HANDLE FunASRWfstDecoderInit(FUNASR_HANDLE handle, int asr_type, float glob_beam, float lat_beam, float am_scale)
  644. {
  645. funasr::WfstDecoder* mm = nullptr;
  646. if (asr_type == ASR_OFFLINE) {
  647. funasr::OfflineStream* offline_stream = (funasr::OfflineStream*)handle;
  648. funasr::Paraformer* paraformer = (funasr::Paraformer*)offline_stream->asr_handle.get();
  649. if (paraformer->lm_)
  650. mm = new funasr::WfstDecoder(paraformer->lm_.get(),
  651. paraformer->GetPhoneSet(), paraformer->GetVocab(), glob_beam, lat_beam, am_scale);
  652. }
  653. return mm;
  654. }
  655. _FUNASRAPI void FunASRWfstDecoderUninit(FUNASR_DEC_HANDLE handle)
  656. {
  657. funasr::WfstDecoder* wfst_decoder = (funasr::WfstDecoder*)handle;
  658. if (!wfst_decoder)
  659. return;
  660. delete wfst_decoder;
  661. }
  662. _FUNASRAPI void FunWfstDecoderLoadHwsRes(FUNASR_DEC_HANDLE handle, int inc_bias, unordered_map<string, int> &hws_map)
  663. {
  664. funasr::WfstDecoder* wfst_decoder = (funasr::WfstDecoder*)handle;
  665. if (!wfst_decoder)
  666. return;
  667. wfst_decoder->LoadHwsRes(inc_bias, hws_map);
  668. }
  669. _FUNASRAPI void FunWfstDecoderUnloadHwsRes(FUNASR_DEC_HANDLE handle)
  670. {
  671. funasr::WfstDecoder* wfst_decoder = (funasr::WfstDecoder*)handle;
  672. if (!wfst_decoder)
  673. return;
  674. wfst_decoder->UnloadHwsRes();
  675. }