ManishThota committed on
Commit
05789a2
·
verified ·
1 Parent(s): 5fb761e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -6
app.py CHANGED
@@ -2,10 +2,15 @@ import warnings
2
  warnings.filterwarnings("ignore")
3
  import gradio as gr
4
  from src.video_model import describe_video # Assuming this function processes the video and query
 
5
 
6
  # --- Function to construct the final query ---
7
  def process_video_and_questions(video, sitting, hands, location, screen):
8
- query = "Describe this video in detail and answer the questions"
 
 
 
 
9
  additional_info = []
10
  if sitting:
11
  additional_info.append("Is the subject in the video standing or sitting?")
@@ -22,9 +27,11 @@ def process_video_and_questions(video, sitting, hands, location, screen):
22
  <annotation>screen_interaction: 0</annotation>"""
23
  final_query = query + " " + " ".join(additional_info)
24
  final_prompt = final_query + " " + end_query
 
25
  # Assuming your describe_video function handles the video processing
26
  response = describe_video(video, final_prompt)
27
- return response
 
28
 
29
  # Video and text inputs for the interface
30
  video = gr.Video(label="Video")
@@ -58,15 +65,13 @@ title = "GSoC Super Raid Annotator"
58
  description = "Annotate Videos"
59
  article = "<p style='text-align: center'><a href='https://github.com/OpenBMB/MiniCPM-V' target='_blank'>Model GitHub Repo</a> | <a href='https://huggingface.co/openbmb/MiniCPM-V-2_6' target='_blank'>Model Page</a></p>"
60
 
61
-
62
  custom_theme = gr.themes.Soft(
63
- # Set the primary hue of the Soft theme to your red color
64
  primary_hue="red",
65
  secondary_hue="red")
66
 
67
  # Launch the interface
68
  interface = gr.Interface(
69
- fn=process_video_and_questions, # Updated function to handle the query construction
70
  inputs=[video, sitting, hands, location, screen],
71
  outputs=response,
72
  examples=examples,
@@ -76,4 +81,4 @@ interface = gr.Interface(
76
  theme=custom_theme,
77
  allow_flagging="never",
78
  )
79
- interface.launch(debug=False)
 
2
  warnings.filterwarnings("ignore")
3
  import gradio as gr
4
  from src.video_model import describe_video # Assuming this function processes the video and query
5
+ import os
6
 
7
  # --- Function to construct the final query ---
8
  def process_video_and_questions(video, sitting, hands, location, screen):
9
+ # Extract the video name (filename)
10
+ video_name = os.path.basename(video)
11
+
12
+ # Construct the query with the video name included
13
+ query = f"Describe the video '{video_name}' in detail and answer the questions"
14
  additional_info = []
15
  if sitting:
16
  additional_info.append("Is the subject in the video standing or sitting?")
 
27
  <annotation>screen_interaction: 0</annotation>"""
28
  final_query = query + " " + " ".join(additional_info)
29
  final_prompt = final_query + " " + end_query
30
+
31
  # Assuming your describe_video function handles the video processing
32
  response = describe_video(video, final_prompt)
33
+ final_response = f"<video_name>{video_name}</video_name>" + " " + response
34
+ return final_response
35
 
36
  # Video and text inputs for the interface
37
  video = gr.Video(label="Video")
 
65
  description = "Annotate Videos"
66
  article = "<p style='text-align: center'><a href='https://github.com/OpenBMB/MiniCPM-V' target='_blank'>Model GitHub Repo</a> | <a href='https://huggingface.co/openbmb/MiniCPM-V-2_6' target='_blank'>Model Page</a></p>"
67
 
 
68
  custom_theme = gr.themes.Soft(
 
69
  primary_hue="red",
70
  secondary_hue="red")
71
 
72
  # Launch the interface
73
  interface = gr.Interface(
74
+ fn=process_video_and_questions,
75
  inputs=[video, sitting, hands, location, screen],
76
  outputs=response,
77
  examples=examples,
 
81
  theme=custom_theme,
82
  allow_flagging="never",
83
  )
84
+ interface.launch(debug=False)