Spaces:
Runtime error
Runtime error
audio to text
Browse files
app.py
CHANGED
|
@@ -19,7 +19,7 @@ seamless_client = Client("facebook/seamless_m4t")
|
|
| 19 |
|
| 20 |
|
| 21 |
|
| 22 |
-
def process_speech(audio_input,input_language,target_language):
|
| 23 |
"""
|
| 24 |
processing sound using seamless_m4t
|
| 25 |
"""
|
|
@@ -42,7 +42,7 @@ def process_speech(audio_input,input_language,target_language):
|
|
| 42 |
audio_input, #audio_name
|
| 43 |
"",
|
| 44 |
input_language,# source language
|
| 45 |
-
target_language,# target language
|
| 46 |
api_name="/run",
|
| 47 |
)
|
| 48 |
out = out[1] # get the text
|
|
@@ -419,16 +419,15 @@ with gr.Blocks(theme='ParityError/Anime') as iface :
|
|
| 419 |
image_input = gr.Image(label="upload image")
|
| 420 |
image_output = gr.Markdown(label="output text")
|
| 421 |
image_button = gr.Button("process image")
|
| 422 |
-
with gr.Tab("speech to text
|
| 423 |
with gr.Row():
|
| 424 |
-
input_language = gr.Dropdown(languages, label="
|
| 425 |
-
target_language = gr.Dropdown(languages, label="target language",value="English",interactive=True)
|
| 426 |
audio_input = gr.Audio(label="speak",type="filepath",sources="microphone")
|
| 427 |
audio_output = gr.Markdown(label="output text")
|
| 428 |
audio_button = gr.Button("process audio")
|
| 429 |
text_button.click(process_and_query, inputs=text_input, outputs=text_output)
|
| 430 |
image_button.click(process_image, inputs=image_input, outputs=image_output)
|
| 431 |
-
audio_button.click(process_speech, inputs=[audio_input,input_language,target_language], outputs=audio_output)
|
| 432 |
|
| 433 |
|
| 434 |
iface.queue().launch(show_error=True,debug=True)
|
|
|
|
| 19 |
|
| 20 |
|
| 21 |
|
| 22 |
+
def process_speech(audio_input,input_language):
|
| 23 |
"""
|
| 24 |
processing sound using seamless_m4t
|
| 25 |
"""
|
|
|
|
| 42 |
audio_input, #audio_name
|
| 43 |
"",
|
| 44 |
input_language,# source language
|
| 45 |
+
input_language,# target language
|
| 46 |
api_name="/run",
|
| 47 |
)
|
| 48 |
out = out[1] # get the text
|
|
|
|
| 419 |
image_input = gr.Image(label="upload image")
|
| 420 |
image_output = gr.Markdown(label="output text")
|
| 421 |
image_button = gr.Button("process image")
|
| 422 |
+
with gr.Tab("speech to text"):
|
| 423 |
with gr.Row():
|
| 424 |
+
input_language = gr.Dropdown(languages, label="select the language",value="French",interactive=True)
|
|
|
|
| 425 |
audio_input = gr.Audio(label="speak",type="filepath",sources="microphone")
|
| 426 |
audio_output = gr.Markdown(label="output text")
|
| 427 |
audio_button = gr.Button("process audio")
|
| 428 |
text_button.click(process_and_query, inputs=text_input, outputs=text_output)
|
| 429 |
image_button.click(process_image, inputs=image_input, outputs=image_output)
|
| 430 |
+
audio_button.click(process_speech, inputs=[audio_input,input_language], outputs=audio_output)
|
| 431 |
|
| 432 |
|
| 433 |
iface.queue().launch(show_error=True,debug=True)
|