Update app.py
Browse files
app.py
CHANGED
|
@@ -141,7 +141,7 @@ def predict(audio_path, question):
|
|
| 141 |
link = "https://github.com/Sreyan88/GAMA"
|
| 142 |
text = "[Github]"
|
| 143 |
paper_link = "https://sreyan88.github.io/gamaaudio/"
|
| 144 |
-
paper_text = "
|
| 145 |
demo = gr.Interface(fn=predict,
|
| 146 |
inputs=[gr.Audio(type="filepath"), gr.Textbox(value='Describe the audio in detail', label='Edit the textbox to ask your own questions!')],
|
| 147 |
outputs=[gr.Textbox(label="Audio Meta Information"), gr.Textbox(label="GAMA Output")],
|
|
@@ -151,4 +151,4 @@ demo = gr.Interface(fn=predict,
|
|
| 151 |
"GAMA-IT is authored by members of the GAMMA Lab at the University of Maryland, College Park and Adobe, USA. <br>" +
|
| 152 |
"**GAMA-IT is not an ASR model and has limited ability to recognize the speech content. It primarily focuses on perception and understanding of non-speech sounds.**<br>" +
|
| 153 |
"Input an audio and ask quesions! Audio will be converted to 16kHz and padded or trim to 10 seconds.")
|
| 154 |
-
demo.launch(
|
|
|
|
| 141 |
link = "https://github.com/Sreyan88/GAMA"
|
| 142 |
text = "[Github]"
|
| 143 |
paper_link = "https://sreyan88.github.io/gamaaudio/"
|
| 144 |
+
paper_text = "https://arxiv.org/pdf/2406.11768"
|
| 145 |
demo = gr.Interface(fn=predict,
|
| 146 |
inputs=[gr.Audio(type="filepath"), gr.Textbox(value='Describe the audio in detail', label='Edit the textbox to ask your own questions!')],
|
| 147 |
outputs=[gr.Textbox(label="Audio Meta Information"), gr.Textbox(label="GAMA Output")],
|
|
|
|
| 151 |
"GAMA-IT is authored by members of the GAMMA Lab at the University of Maryland, College Park and Adobe, USA. <br>" +
|
| 152 |
"**GAMA-IT is not an ASR model and has limited ability to recognize the speech content. It primarily focuses on perception and understanding of non-speech sounds.**<br>" +
|
| 153 |
"Input an audio and ask quesions! Audio will be converted to 16kHz and padded or trim to 10 seconds.")
|
| 154 |
+
demo.launch()
|