Spaces:

adiv07
/

SOAP_temp

Runtime error

App Files Files Community

adiv07 committed on Jul 17, 2024

Commit

91b6d49

verified ·

1 Parent(s): b143466

Update Gpt4oDemo.py

Browse files

Files changed (1) hide show

Gpt4oDemo.py +19 -20

Gpt4oDemo.py CHANGED Viewed

@@ -139,31 +139,30 @@ def process_video(video_path, seconds_per_frame=2, target_width=320, target_heig
     clip.audio.write_audiofile(audio_path, bitrate="32k")
     clip.audio.close()
     clip.close()
-    #transcribe_video(audio_path)
     print(f"Extracted {len(base64Frames)} frames")
     print(f"Extracted audio to {audio_path}")
     return base64Frames, audio_path
 chat_history = []
-# chat_history.append({
-#             "role": "system",
-#             "content": (
-#                     """
-#                         You are an assistant chatbot for a Speech Language Pathologist (SLP).
-#                         Your task is to help analyze a provided video of a therapy session and answer questions accurately.
-#                         Provide timestamps for specific events or behaviors mentioned. Conclude each response with possible follow-up questions.
-#                         Follow these steps:
-#                         1.	Suggest to the user to ask, “To get started, you can try asking me how many people there are in the video.”
-#                         2.  Detect how many people are in the video.
-#                         2.	Suggest to the user to tell you the names of the people in the video, starting from left to right.
-#                         3.	After receiving the names, respond with, “Ok thank you! Now you can ask me any questions about this video.”
-#                         4.	If the user asks about a behavior, respond with, “My understanding of this behavior is [xxx - AI generated output]. Is this a behavior that you want to track? If it is, please define this behavior and tell me more about it so I can analyze it more accurately according to your practice.”
-#                         5.	If you receive names, confirm that these are the names of the people from left to right.
-#                     """
-#             )
-#         })
 def transcribe_video(filename):
     global transcript

     clip.audio.write_audiofile(audio_path, bitrate="32k")
     clip.audio.close()
     clip.close()
+    transcribe_video(audio_path)
     print(f"Extracted {len(base64Frames)} frames")
     print(f"Extracted audio to {audio_path}")
     return base64Frames, audio_path
 chat_history = []
+chat_history.append({
+            "role": "system",
+            "content": (
+                    """
+                        You are an assistant chatbot for a Speech Language Pathologist (SLP).
+                        Your task is to help analyze a provided video of a therapy session and answer questions accurately.
+                        Provide timestamps in MM:SS format as frames are given at 1 fps for specific events or behaviors mentioned.
+                        Analyse the video for IBR based on the information below. Initiating Behavioral Request (IBR): the child's skill in using behavior(s) to elicit aid in obtaining an object or an object-related event.
+                        Instances of IBR:
+                        -Language: Listen for intelligible single words or greater verbal expressions the child uses to request an object or assistance.
+                        -React: Observe if the child extends their arm with an open palm towards the object or the adult. Do not consider grabbing as a requesting gesture.
+                        -Point: Look for the child pointing at the object or direction where the object is located.
+                        -Give: Watch if the child hands a toy or object to the adult to request help.
+                    """
+            )
+        })
 def transcribe_video(filename):
     global transcript