|
|
@@ -1371,10 +1371,7 @@ def inference_transducer(
|
|
|
left_context=left_context,
|
|
|
right_context=right_context,
|
|
|
)
|
|
|
- speech2text = Speech2TextTransducer.from_pretrained(
|
|
|
- model_tag=model_tag,
|
|
|
- **speech2text_kwargs,
|
|
|
- )
|
|
|
+ speech2text = Speech2TextTransducer(**speech2text_kwargs)
|
|
|
|
|
|
def _forward(data_path_and_name_and_type,
|
|
|
raw_inputs: Union[np.ndarray, torch.Tensor] = None,
|