speech_asr 3 года назад
Родитель
Commit
2f933cb101
2 изменённых файла: 0 добавлено и 6 удалено
  1. 0 4
      funasr/bin/eend_ola_inference.py
  2. 0 2
      funasr/models/e2e_diar_eend_ola.py

+ 0 - 4
funasr/bin/eend_ola_inference.py

@@ -27,9 +27,6 @@ from funasr.utils.types import str2bool
 from funasr.utils.types import str2triple_str
 from funasr.utils.types import str_or_none
 
-from modelscope.utils.logger import get_logger
-logger = get_logger()
-
 class Speech2Diarization:
     """Speech2Diarlization class
 
@@ -211,7 +208,6 @@ def inference_modelscope(
             if isinstance(raw_inputs, torch.Tensor):
                 raw_inputs = raw_inputs.numpy()
             data_path_and_name_and_type = [raw_inputs[0], "speech", "bytes"]
-        logger.info(data_path_and_name_and_type)
         loader = EENDOLADiarTask.build_streaming_iterator(
             data_path_and_name_and_type,
             dtype=dtype,

+ 0 - 2
funasr/models/e2e_diar_eend_ola.py

@@ -190,8 +190,6 @@ class DiarEENDOLAModel(AbsESPnetModel):
                             shuffle: bool = True,
                             threshold: float = 0.5,
                             **kwargs):
-        if self.frontend is not None:
-            speech = self.frontend(speech)
         speech = [s[:s_len] for s, s_len in zip(speech, speech_lengths)]
         emb = self.forward_encoder(speech, speech_lengths)
         if shuffle: