嘉渊 пре 2 године
родитељ
комит
27a3d1855d
1 измењен фајл са 1 додавањем и 1 уклањањем
  1. 1 1
      egs/wenetspeech/conformer/local/process_opus.py

+ 1 - 1
egs/wenetspeech/conformer/local/process_opus.py

@@ -65,7 +65,7 @@ def output(output_wav_scp, utt_list, seg_path_list, start_time_list, end_time_li
 
             start = int(start_time_list[i] * sample_rate)
             end = int(end_time_list[i] * sample_rate)
-            target_audio = waveform[:, start:end].transpose(0, 1).contiguous()
+            target_audio = waveform[:, start:end]
             torchaudio.save(seg_wav_path, target_audio, sample_rate)
 
             fout.write("{} {}\n".format(utt_id, seg_wav_path))