Spaces:
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -52,7 +52,7 @@ BADGE = """
|
|
52 |
"""
|
53 |
|
54 |
LOGO = '<p align="center"><img width="350" src="https://raw.githubusercontent.com/yeliudev/VideoMind/refs/heads/main/.github/logo.png"></p>'
|
55 |
-
DISC = '**VideoMind** is a multi-modal agent framework that enhances video reasoning by emulating *human-like* processes, such as *breaking down tasks*, *localizing and verifying moments*, and *synthesizing answers*.'
|
56 |
|
57 |
# yapf:disable
|
58 |
EXAMPLES = [
|
@@ -624,7 +624,7 @@ def build_demo():
|
|
624 |
submit_ctx = submit_ctx.then(main, [video, prompt, role, temperature, max_new_tokens], chat)
|
625 |
submit_ctx.then(enable_btns, None, [random_btn, reset_btn, submit_btn])
|
626 |
|
627 |
-
gr.Markdown('
|
628 |
|
629 |
with gr.Column(scale=5):
|
630 |
chat.render()
|
|
|
52 |
"""
|
53 |
|
54 |
LOGO = '<p align="center"><img width="350" src="https://raw.githubusercontent.com/yeliudev/VideoMind/refs/heads/main/.github/logo.png"></p>'
|
55 |
+
DISC = '**VideoMind** is a multi-modal agent framework that enhances video reasoning by emulating *human-like* processes, such as *breaking down tasks*, *localizing and verifying moments*, and *synthesizing answers*. Our method addresses the unique challenges of temporal-grounded reasoning in a progressive strategy. This demo showcases how VideoMind-2B handles video-language tasks. Please open an <a href="https://github.com/yeliudev/VideoMind/issues/new" target="_blank">issue</a> if you meet any problems.' # noqa
|
56 |
|
57 |
# yapf:disable
|
58 |
EXAMPLES = [
|
|
|
624 |
submit_ctx = submit_ctx.then(main, [video, prompt, role, temperature, max_new_tokens], chat)
|
625 |
submit_ctx.then(enable_btns, None, [random_btn, reset_btn, submit_btn])
|
626 |
|
627 |
+
gr.Markdown('###### Need example data? Explore examples tab or click 🔮 Random to sample one!')
|
628 |
|
629 |
with gr.Column(scale=5):
|
630 |
chat.render()
|