Update app.py
app.py CHANGED
@@ -14,12 +14,17 @@ p = pipeline("automatic-speech-recognition", model=model)
 
 transcriber = pipeline("automatic-speech-recognition", model=model)
 
-
-
+
+def transcribe(stream, new_chunk):
+    sr, y = new_chunk
     y = y.astype(np.float32)
     y /= np.max(np.abs(y))
 
-
+    if stream is not None:
+        stream = np.concatenate([stream, y])
+    else:
+        stream = y
+    return stream, transcriber({"sampling_rate": sr, "raw": stream})["text"]
 
 
 
@@ -45,8 +50,9 @@ with gr.Blocks() as demo:
     with gr.Tab("Real Time Speech Recognition"):
         with gr.Row():
             transcribe,
-
-
+            ["state", gr.Audio(sources=["microphone"], streaming=True)],
+            ["state", "text"],
+            live=True
 
 
 demo.launch()
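
For reference, a minimal sketch of how the streaming transcription added in this commit fits together. The imports, the `model` value, and the `gr.Interface(...)` wrapper around the listed arguments are assumptions based on context and are not shown in the diff; names like `streaming_demo` are illustrative only.

import numpy as np
import gradio as gr
from transformers import pipeline

# Assumed placeholder; app.py sets `model` elsewhere, outside this diff.
model = "openai/whisper-base.en"
transcriber = pipeline("automatic-speech-recognition", model=model)

def transcribe(stream, new_chunk):
    sr, y = new_chunk                         # new microphone chunk: (sample rate, samples)
    y = y.astype(np.float32)
    y /= np.max(np.abs(y))                    # normalize the chunk to [-1, 1]
    if stream is not None:
        stream = np.concatenate([stream, y])  # append the chunk to the audio seen so far
    else:
        stream = y                            # first chunk starts the stream
    # Transcribe the full accumulated audio; return it as the new state plus the text
    return stream, transcriber({"sampling_rate": sr, "raw": stream})["text"]

# Assumed wrapper: the diff only shows the arguments (transcribe, inputs, outputs, live=True).
streaming_demo = gr.Interface(
    transcribe,
    ["state", gr.Audio(sources=["microphone"], streaming=True)],
    ["state", "text"],
    live=True,
)

with gr.Blocks() as demo:
    with gr.Tab("Real Time Speech Recognition"):
        with gr.Row():
            streaming_demo.render()           # embed the streaming interface in the tab

demo.launch()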