|
@@ -7,10 +7,13 @@ if __name__ == '__main__':
|
|
|
inference_pipeline = pipeline(
|
|
inference_pipeline = pipeline(
|
|
|
task=Tasks.auto_speech_recognition,
|
|
task=Tasks.auto_speech_recognition,
|
|
|
model='damo/speech_paraformer-large-vad-punc_asr_nat-zh-cn-16k-common-vocab8404-pytorch',
|
|
model='damo/speech_paraformer-large-vad-punc_asr_nat-zh-cn-16k-common-vocab8404-pytorch',
|
|
|
|
|
+ model_revision="v1.2.1",
|
|
|
vad_model='damo/speech_fsmn_vad_zh-cn-16k-common-pytorch',
|
|
vad_model='damo/speech_fsmn_vad_zh-cn-16k-common-pytorch',
|
|
|
vad_model_revision="v1.1.8",
|
|
vad_model_revision="v1.1.8",
|
|
|
punc_model='damo/punc_ct-transformer_zh-cn-common-vocab272727-pytorch',
|
|
punc_model='damo/punc_ct-transformer_zh-cn-common-vocab272727-pytorch',
|
|
|
- punc_model_revision="v1.1.6")
|
|
|
|
|
|
|
+ punc_model_revision="v1.1.6",
|
|
|
|
|
+ ngpu=1,
|
|
|
|
|
+ )
|
|
|
rec_result = inference_pipeline(audio_in=audio_in)
|
|
rec_result = inference_pipeline(audio_in=audio_in)
|
|
|
print(rec_result)
|
|
print(rec_result)
|
|
|
|
|
|