GAMA-IT

Running on Zero

sonalkum committed on Jul 5, 2024

Commit

e2a134d

verified ·

1 Parent(s): a35500a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -141,7 +141,7 @@ def predict(audio_path, question):
 link = "https://github.com/Sreyan88/GAMA"
 text = "[Github]"
 paper_link = "https://sreyan88.github.io/gamaaudio/"
-paper_text = "[Paper]"
 demo = gr.Interface(fn=predict,
                     inputs=[gr.Audio(type="filepath"), gr.Textbox(value='Describe the audio in detail', label='Edit the textbox to ask your own questions!')],
                     outputs=[gr.Textbox(label="Audio Meta Information"), gr.Textbox(label="GAMA Output")],
@@ -151,4 +151,4 @@ demo = gr.Interface(fn=predict,
                     "GAMA-IT is authored by members of the GAMMA Lab at the University of Maryland, College Park and Adobe, USA. <br>" +
                     "**GAMA-IT is not an ASR model and has limited ability to recognize the speech content. It primarily focuses on perception and understanding of non-speech sounds.**<br>" +
                     "Input an audio and ask quesions! Audio will be converted to 16kHz and padded or trim to 10 seconds.")
-demo.launch(debug=True, share=True)

 link = "https://github.com/Sreyan88/GAMA"
 text = "[Github]"
 paper_link = "https://sreyan88.github.io/gamaaudio/"
+paper_text = "https://arxiv.org/pdf/2406.11768"
 demo = gr.Interface(fn=predict,
                     inputs=[gr.Audio(type="filepath"), gr.Textbox(value='Describe the audio in detail', label='Edit the textbox to ask your own questions!')],
                     outputs=[gr.Textbox(label="Audio Meta Information"), gr.Textbox(label="GAMA Output")],
                     "GAMA-IT is authored by members of the GAMMA Lab at the University of Maryland, College Park and Adobe, USA. <br>" +
                     "**GAMA-IT is not an ASR model and has limited ability to recognize the speech content. It primarily focuses on perception and understanding of non-speech sounds.**<br>" +
                     "Input an audio and ask quesions! Audio will be converted to 16kHz and padded or trim to 10 seconds.")
+demo.launch()