Spaces:
Running
Running
update
Browse files
- examples/wenet/toolbox_infer.py +18 -18
- toolbox/k2_sherpa/decode.py +0 -1
examples/wenet/toolbox_infer.py
CHANGED
|
@@ -42,25 +42,25 @@ def main():
|
|
| 42 |
args = get_args()
|
| 43 |
|
| 44 |
# audio convert
|
| 45 |
-
signal, sample_rate = librosa.load(args.in_filename, sr=args.sample_rate)
|
| 46 |
-
signal *= 32768.0
|
| 47 |
-
signal = np.array(signal, dtype=np.int16)
|
| 48 |
-
|
| 49 |
-
temp_file = temp_directory / "temp.wav"
|
| 50 |
-
wavfile.write(
|
| 51 |
-
temp_file.as_posix(),
|
| 52 |
-
rate=args.sample_rate,
|
| 53 |
-
data=signal
|
| 54 |
-
)
|
| 55 |
|
| 56 |
# audio convert
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
|
| 62 |
-
|
| 63 |
-
|
| 64 |
|
| 65 |
# load recognizer
|
| 66 |
m_dict = models.model_map["Chinese"][0]
|
|
@@ -105,7 +105,7 @@ def main():
|
|
| 105 |
# print("text: {}".format(text))
|
| 106 |
|
| 107 |
text = decode.decode_by_recognizer(recognizer=recognizer,
|
| 108 |
-
filename=
|
| 109 |
)
|
| 110 |
print("text: {}".format(text))
|
| 111 |
return
|
|
|
|
| 42 |
args = get_args()
|
| 43 |
|
| 44 |
# audio convert
|
| 45 |
+
# signal, sample_rate = librosa.load(args.in_filename, sr=args.sample_rate)
|
| 46 |
+
# signal *= 32768.0
|
| 47 |
+
# signal = np.array(signal, dtype=np.int16)
|
| 48 |
+
#
|
| 49 |
+
# temp_file = temp_directory / "temp.wav"
|
| 50 |
+
# wavfile.write(
|
| 51 |
+
# temp_file.as_posix(),
|
| 52 |
+
# rate=args.sample_rate,
|
| 53 |
+
# data=signal
|
| 54 |
+
# )
|
| 55 |
|
| 56 |
# audio convert
|
| 57 |
+
in_filename = Path(args.in_filename)
|
| 58 |
+
out_filename = Path(tempfile.gettempdir()) / "asr" / in_filename.name
|
| 59 |
+
out_filename.parent.mkdir(parents=True, exist_ok=True)
|
| 60 |
+
|
| 61 |
+
audio_convert(in_filename=in_filename.as_posix(),
|
| 62 |
+
out_filename=out_filename.as_posix(),
|
| 63 |
+
)
|
| 64 |
|
| 65 |
# load recognizer
|
| 66 |
m_dict = models.model_map["Chinese"][0]
|
|
|
|
| 105 |
# print("text: {}".format(text))
|
| 106 |
|
| 107 |
text = decode.decode_by_recognizer(recognizer=recognizer,
|
| 108 |
+
filename=out_filename.as_posix(),
|
| 109 |
)
|
| 110 |
print("text: {}".format(text))
|
| 111 |
return
|
toolbox/k2_sherpa/decode.py
CHANGED
|
@@ -40,7 +40,6 @@ def decode_offline_recognizer(recognizer: sherpa.OfflineRecognizer,
|
|
| 40 |
recognizer.decode_stream(s)
|
| 41 |
|
| 42 |
text = s.result.text.strip()
|
| 43 |
-
print("text: {}".format(text))
|
| 44 |
return text.lower()
|
| 45 |
|
| 46 |
|
|
|
|
| 40 |
recognizer.decode_stream(s)
|
| 41 |
|
| 42 |
text = s.result.text.strip()
|
|
|
|
| 43 |
return text.lower()
|
| 44 |
|
| 45 |
|