Chroma-Extra

Running on Zero

App Files Community

gokaygokay committed on Mar 2

Commit

2022eac

1 Parent(s): dfc83f9

add init

Browse files

Files changed (1) hide show

llm_inference_video.py +29 -1

llm_inference_video.py CHANGED Viewed

@@ -90,7 +90,9 @@ class VideoLLMInferenceNode:
         custom_elements: str = "",
         provider: str = "SambaNova",
         model: str = "Meta-Llama-3.1-70B-Instruct",
-        prompt_length: str = "Medium"
     ) -> str:
         """
         Generate a video prompt using the specified LLM provider
@@ -106,6 +108,8 @@ class VideoLLMInferenceNode:
             provider: LLM provider (SambaNova or Groq)
             model: Model name
             prompt_length: Desired prompt length
         Returns:
             str: Generated video prompt
@@ -114,6 +118,24 @@ class VideoLLMInferenceNode:
             return "Please enter a concept for the video."
         try:
             # Helper function to format optional elements
             def format_element(element, element_type):
                 if element == "None" or not element:
@@ -203,6 +225,9 @@ Focus on these elements while maintaining the specified sentence count:
 4. Style and aesthetic choices
 5. Key moments
 6. Emotional impact
 IMPORTANT REQUIREMENTS:
 - Deliver exactly the specified number of sentences
@@ -220,8 +245,11 @@ IMPORTANT REQUIREMENTS:
 Camera Movement: {camera_movement if camera_movement else 'No specific camera movement'}
 Core Concept: {concept}
 Please create a {prompt_length.lower()}-length description incorporating these elements into a cohesive narrative.
 Avoid talking about 'video' or 'videos'. Do not start with 'The video opens with...' or 'The video starts with...' and do not include 'in this video' or 'focus of this video'. kind of terms. Do not say "Here is your video prompt" or "Here is your video description" or anything like that. Just give the prompt."""
             # Call the appropriate API based on provider

         custom_elements: str = "",
         provider: str = "SambaNova",
         model: str = "Meta-Llama-3.1-70B-Instruct",
+        prompt_length: str = "Medium",
+        image_path: str = "",
+        video_path: str = ""
     ) -> str:
         """
         Generate a video prompt using the specified LLM provider
             provider: LLM provider (SambaNova or Groq)
             model: Model name
             prompt_length: Desired prompt length
+            image_path: Optional path to an image for VLM description
+            video_path: Optional path to a video for VLM description
         Returns:
             str: Generated video prompt
             return "Please enter a concept for the video."
         try:
+            # Get VLM descriptions if image or video paths are provided
+            image_description = ""
+            video_description = ""
+            if image_path:
+                try:
+                    image_description = self.analyze_image(image_path, "Describe this image in detail for a video creator.")
+                    print(f"Generated image description: {image_description}")
+                except Exception as e:
+                    print(f"Error generating image description: {str(e)}")
+            if video_path:
+                try:
+                    video_description = self.analyze_video(video_path)
+                    print(f"Generated video description: {video_description}")
+                except Exception as e:
+                    print(f"Error generating video description: {str(e)}")
             # Helper function to format optional elements
             def format_element(element, element_type):
                 if element == "None" or not element:
 4. Style and aesthetic choices
 5. Key moments
 6. Emotional impact
+{'' if not image_description and not video_description else '7. Elements from the provided image/video descriptions'}
+{'' if not image_description and not video_description else 'If image or video descriptions are provided, incorporate their key visual elements and content into your description to ensure accuracy and relevance.'}
 IMPORTANT REQUIREMENTS:
 - Deliver exactly the specified number of sentences
 Camera Movement: {camera_movement if camera_movement else 'No specific camera movement'}
 Core Concept: {concept}
+{f'Reference Image Description: {image_description}' if image_description else ''}
+{f'Reference Video Description: {video_description}' if video_description else ''}
 Please create a {prompt_length.lower()}-length description incorporating these elements into a cohesive narrative.
+{'' if not image_description and not video_description else 'Use the provided image/video descriptions as reference to inform your prompt creation.'}
 Avoid talking about 'video' or 'videos'. Do not start with 'The video opens with...' or 'The video starts with...' and do not include 'in this video' or 'focus of this video'. kind of terms. Do not say "Here is your video prompt" or "Here is your video description" or anything like that. Just give the prompt."""
             # Call the appropriate API based on provider