Update app.py
Browse files
app.py
CHANGED
@@ -48,10 +48,18 @@ def transcribe(audio_path):
|
|
48 |
|
49 |
|
50 |
#------
|
51 |
-
|
|
|
|
|
|
|
|
|
|
|
52 |
with torch.no_grad():
|
53 |
-
predicted_ids = model.generate(
|
|
|
|
|
54 |
transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)[0]
|
|
|
55 |
return transcription
|
56 |
|
57 |
|
|
|
48 |
|
49 |
|
50 |
#------
|
51 |
+
audio_cnt, sr = librosa.load(audio_path, sr=16000)
|
52 |
+
|
53 |
+
# 将音频数据传递给 processor
|
54 |
+
input_values = processor(audio, sampling_rate=16000, return_tensors="pt").input_values
|
55 |
+
|
56 |
+
# 模型推理
|
57 |
with torch.no_grad():
|
58 |
+
predicted_ids = model.generate(input_values)
|
59 |
+
|
60 |
+
# 解码得到转录结果
|
61 |
transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)[0]
|
62 |
+
|
63 |
return transcription
|
64 |
|
65 |
|