# cmvn_converter.py
  1. import argparse
  2. import json
  3. import numpy as np
  4. def get_parser():
  5. parser = argparse.ArgumentParser(
  6. description="cmvn converter",
  7. formatter_class=argparse.ArgumentDefaultsHelpFormatter,
  8. )
  9. parser.add_argument(
  10. "--cmvn_json",
  11. default=False,
  12. required=True,
  13. type=str,
  14. help="cmvn json file",
  15. )
  16. parser.add_argument(
  17. "--am_mvn",
  18. default=False,
  19. required=True,
  20. type=str,
  21. help="am mvn file",
  22. )
  23. return parser
  24. def main():
  25. parser = get_parser()
  26. args = parser.parse_args()
  27. with open(args.cmvn_json, "r") as fin:
  28. cmvn_dict = json.load(fin)
  29. mean_stats = np.array(cmvn_dict["mean_stats"])
  30. var_stats = np.array(cmvn_dict["var_stats"])
  31. total_frame = np.array(cmvn_dict["total_frames"])
  32. mean = -1.0 * mean_stats / total_frame
  33. var = 1.0 / np.sqrt(var_stats / total_frame - mean * mean)
  34. dims = mean.shape[0]
  35. with open(args.am_mvn, 'w') as fout:
  36. fout.write("<Nnet>" + "\n" + "<Splice> " + str(dims) + " " + str(dims) + '\n' + "[ 0 ]" + "\n" + "<AddShift> " + str(dims) + " " + str(dims) + "\n")
  37. mean_str = str(list(mean)).replace(',', '').replace('[', '[ ').replace(']', ' ]')
  38. fout.write("<LearnRateCoef> 0 " + mean_str + '\n')
  39. fout.write("<Rescale> " + str(dims) + " " + str(dims) + '\n')
  40. var_str = str(list(var)).replace(',', '').replace('[', '[ ').replace(']', ' ]')
  41. fout.write("<LearnRateCoef> 0 " + var_str + '\n')
  42. fout.write("</Nnet>" + '\n')
  43. if __name__ == '__main__':
  44. main()