SmolVLM2-XSPFGenerator

Running on Zero

App Files Files Community

Miquel Farre committed on Feb 13

Commit

b7a96e8

1 Parent(s): 312644d

fix

Browse files

Files changed (1) hide show

app.py +8 -3

app.py CHANGED Viewed

@@ -57,7 +57,12 @@ class VideoHighlightDetector:
     def analyze_video_content(self, video_path: str) -> str:
         """Analyze video content to determine its type and description."""
         messages = [
             {
                 "role": "user",
                 "content": [
@@ -76,7 +81,7 @@ class VideoHighlightDetector:
         ).to(self.device)
         outputs = self.model.generate(**inputs, max_new_tokens=512, do_sample=True, temperature=0.7)
-        return self.processor.decode(outputs[0], skip_special_tokens=True)
     def determine_highlights(self, video_description: str) -> str:
         """Determine what constitutes highlights based on video description."""
@@ -104,7 +109,7 @@ class VideoHighlightDetector:
         ).to(self.device)
         outputs = self.model.generate(**inputs, max_new_tokens=256, do_sample=True, temperature=0.7)
-        return self.processor.decode(outputs[0], skip_special_tokens=True)
     def process_segment(self, video_path: str, highlight_types: str) -> bool:
         """Process a video segment and determine if it contains highlights."""
@@ -132,7 +137,7 @@ class VideoHighlightDetector:
         ).to(self.device)
         outputs = self.model.generate(**inputs, max_new_tokens=64, do_sample=False)
-        response = self.processor.decode(outputs[0], skip_special_tokens=True).lower()
         return "yes" in response

     def analyze_video_content(self, video_path: str) -> str:
         """Analyze video content to determine its type and description."""
+        system_message = "You are a helpful assistant that can understand videos. Describe what type of video this is and what's happening in it."
         messages = [
+            {
+                "role": "system",
+                "content": [{"type": "text", "text": system_message}]
+            },
             {
                 "role": "user",
                 "content": [
         ).to(self.device)
         outputs = self.model.generate(**inputs, max_new_tokens=512, do_sample=True, temperature=0.7)
+        return self.processor.decode(outputs[0], skip_special_tokens=True).lower().split("Assistant: ")[1]
     def determine_highlights(self, video_description: str) -> str:
         """Determine what constitutes highlights based on video description."""
         ).to(self.device)
         outputs = self.model.generate(**inputs, max_new_tokens=256, do_sample=True, temperature=0.7)
+        return self.processor.decode(outputs[0], skip_special_tokens=True).lower().split("Assistant: ")[1]
     def process_segment(self, video_path: str, highlight_types: str) -> bool:
         """Process a video segment and determine if it contains highlights."""
         ).to(self.device)
         outputs = self.model.generate(**inputs, max_new_tokens=64, do_sample=False)
+        response = self.processor.decode(outputs[0], skip_special_tokens=True).lower().split("Assistant: ")[1]
         return "yes" in response