游雁 2 سال پیش
والد
کامیت
a4254193de

BIN
docs/images/wechat.png


+ 2 - 1
egs_modelscope/asr_vad_punc/speech_paraformer-large-vad-punc_asr_nat-zh-cn-16k-common-vocab8404-pytorch/demo.py

@@ -8,9 +8,10 @@ if __name__ == '__main__':
         task=Tasks.auto_speech_recognition,
         model='damo/speech_paraformer-large-vad-punc_asr_nat-zh-cn-16k-common-vocab8404-pytorch',
         vad_model='damo/speech_fsmn_vad_zh-cn-16k-common-pytorch',
+        #punc_model='damo/punc_ct-transformer_zh-cn-common-vocab272727-pytorch',
         punc_model='damo/punc_ct-transformer_cn-en-common-vocab471067-large',
         output_dir=output_dir,
     )
-    rec_result = inference_pipeline(audio_in=audio_in, batch_size_token=5000, batch_size_token_threshold_s=40)
+    rec_result = inference_pipeline(audio_in=audio_in, batch_size_token=5000, batch_size_token_threshold_s=40, max_single_segment_time=6000)
     print(rec_result)