北念 2 года назад
Родитель
Commit
a9600a123e
1 изменённый файл: 4 добавления и 3 удаления
  1. 4 3
      funasr/bin/asr_infer.py

+ 4 - 3
funasr/bin/asr_infer.py

@@ -1922,9 +1922,6 @@ class Speech2TextWhisper:
     ):
 
         from funasr.tasks.whisper import ASRTask
-        from funasr.utils.whisper_utils.transcribe import transcribe
-        from funasr.utils.whisper_utils.audio import pad_or_trim, log_mel_spectrogram
-        from funasr.utils.whisper_utils.decoding import DecodingOptions, detect_language, decode
 
         # 1. Build ASR model
         scorers = {}
@@ -1987,6 +1984,10 @@ class Speech2TextWhisper:
 
         """
 
+        from funasr.utils.whisper_utils.transcribe import transcribe
+        from funasr.utils.whisper_utils.audio import pad_or_trim, log_mel_spectrogram
+        from funasr.utils.whisper_utils.decoding import DecodingOptions, detect_language, decode
+
         speech = speech[0]
         speech = pad_or_trim(speech)
         mel = log_mel_spectrogram(speech).to(self.device)