HoneyTian committed on
Commit
cd1dd54
·
1 Parent(s): d39598e
Files changed (1) hide show
  1. examples/wenet/toolbox_infer.py +13 -1
examples/wenet/toolbox_infer.py CHANGED
@@ -41,6 +41,18 @@ def get_args():
41
  def main():
42
  args = get_args()
43
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  # audio convert
45
  in_filename = Path(args.in_filename)
46
  out_filename = Path(tempfile.gettempdir()) / "asr" / in_filename.name
@@ -69,7 +81,7 @@ def main():
69
  )
70
 
71
  text = decode.decode_by_recognizer(recognizer=recognizer,
72
- filename=out_filename.as_posix(),
73
  )
74
  print("text: {}".format(text))
75
  return
 
41
  def main():
42
  args = get_args()
43
 
44
+ # audio convert
45
+ signal, sample_rate = librosa.load(args.filename, sr=args.sample_rate)
46
+ signal *= 32768.0
47
+ signal = np.array(signal, dtype=np.int16)
48
+
49
+ temp_file = temp_directory / "temp.wav"
50
+ wavfile.write(
51
+ temp_file.as_posix(),
52
+ rate=args.sample_rate,
53
+ data=signal
54
+ )
55
+
56
  # audio convert
57
  in_filename = Path(args.in_filename)
58
  out_filename = Path(tempfile.gettempdir()) / "asr" / in_filename.name
 
81
  )
82
 
83
  text = decode.decode_by_recognizer(recognizer=recognizer,
84
+ filename=temp_file,
85
  )
86
  print("text: {}".format(text))
87
  return