#!/usr/bin/env bash
#
# finetune.sh - two-step fine-tuning recipe:
#   1. run funasr/datasets/audio_datasets/scp2jsonl.py to turn a wav.scp /
#      text.txt pair into a jsonl manifest;
#   2. run funasr/bin/train.py on the model
#      "damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch".
#
# Both Python entry points are referenced by relative path (funasr/...), so
# invoke this script from a directory where those paths resolve.
#
# Optional environment overrides (each default is the original hard-coded
# value, so running with none of them set passes the same arguments as before):
#   FUNASR_DATA_DIR     directory containing wav.scp and text.txt; the
#                       generated audio_datasets.jsonl is written there too
#   FUNASR_TRAIN_JSONL  value passed as train_data_set_list
#   FUNASR_VALID_JSONL  value passed as valid_data_set_list
#                       (defaults to the training list, as in the original)
#   FUNASR_OUTPUT_DIR   value passed as output_dir

# Stop at the first failing step instead of training after a failed
# manifest generation; treat unset variables as errors.
set -euo pipefail

data_dir=${FUNASR_DATA_DIR:-/Users/zhifu/funasr1.0/test_local}
train_jsonl=${FUNASR_TRAIN_JSONL:-/Users/zhifu/funasr_github/test_local/aishell2_dev_ios/asr_task_debug_len_10.jsonl}
valid_jsonl=${FUNASR_VALID_JSONL:-${train_jsonl}}
output_dir=${FUNASR_OUTPUT_DIR:-outputs/debug/ckpt/funasr2/exp2}

## download model (disabled; uncomment to clone the model repository locally)
#local_path_root=../modelscope_models
#mkdir -p ${local_path_root}
#local_path=${local_path_root}/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch
#git clone https://www.modelscope.cn/damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch.git ${local_path}

## generate jsonl from wav.scp and text.txt
# The list-valued overrides contain double quotes and brackets, so each one is
# passed as a single quoted shell word.
python funasr/datasets/audio_datasets/scp2jsonl.py \
  "++scp_file_list=[\"${data_dir}/wav.scp\", \"${data_dir}/text.txt\"]" \
  '++data_type_list=["source", "target"]' \
  "++jsonl_file_out=${data_dir}/audio_datasets.jsonl"

# NOTE(review): with the default values, the train/valid lists below do NOT
# point at the audio_datasets.jsonl generated above - confirm this is intended,
# or set FUNASR_TRAIN_JSONL="${FUNASR_DATA_DIR}/audio_datasets.jsonl".

# Disabled launcher lines kept from the original script:
# torchrun \
# --nnodes 1 \
# --nproc_per_node 1 \
python funasr/bin/train.py \
  +model="damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch" \
  +model_revision="v2.0.4" \
  +train_data_set_list="${train_jsonl}" \
  +valid_data_set_list="${valid_jsonl}" \
  ++dataset_conf.batch_size=64 \
  ++dataset_conf.batch_type="example" \
  ++train_conf.max_epoch=2 \
  ++dataset_conf.num_workers=4 \
  +output_dir="${output_dir}" \
  +debug="true"