InstaVideo

Runtime error

App Files Files Community

rahul7star committed about 1 month ago

Commit

aeb9017

verified ·

1 Parent(s): 07fdcce

new math testing

Browse files

Files changed (1) hide show

app.py +56 -13

app.py CHANGED Viewed

@@ -34,24 +34,66 @@ pipe.load_lora_weights(causvid_path, adapter_name="causvid_lora")
 pipe.set_adapters(["causvid_lora"], adapter_weights=[0.95])
 pipe.fuse_lora()
 MOD_VALUE = 32
-DEFAULT_H_SLIDER_VALUE =  512
-DEFAULT_W_SLIDER_VALUE =  896
-# Environment variable check
-IS_ORIGINAL_SPACE = os.environ.get("IS_ORIGINAL_SPACE", "True") == "True"
-# Original limits
-ORIGINAL_SLIDER_MIN_H, ORIGINAL_SLIDER_MAX_H = 128, 1280
-ORIGINAL_SLIDER_MIN_W, ORIGINAL_SLIDER_MAX_W = 128, 1280
-ORIGINAL_MAX_DURATION = round(81/24, 1)  # MAX_FRAMES_MODEL/FIXED_FPS
-# Limited space constants
 LIMITED_MAX_RESOLUTION = 640
 LIMITED_MAX_DURATION = 2.0
 LIMITED_MAX_STEPS = 4
-# Set limits based on environment variable
 if IS_ORIGINAL_SPACE:
     SLIDER_MIN_H, SLIDER_MAX_H = 128, LIMITED_MAX_RESOLUTION
     SLIDER_MIN_W, SLIDER_MAX_W = 128, LIMITED_MAX_RESOLUTION
@@ -61,14 +103,15 @@ else:
     SLIDER_MIN_H, SLIDER_MAX_H = ORIGINAL_SLIDER_MIN_H, ORIGINAL_SLIDER_MAX_H
     SLIDER_MIN_W, SLIDER_MAX_W = ORIGINAL_SLIDER_MIN_W, ORIGINAL_SLIDER_MAX_W
     MAX_DURATION = ORIGINAL_MAX_DURATION
-    MAX_STEPS = 8
 MAX_SEED = np.iinfo(np.int32).max
 FIXED_FPS = 24
-FIXED_OUTPUT_FPS = 18 # we downspeed the output video as a temporary "trick"
 MIN_FRAMES_MODEL = 8
-MAX_FRAMES_MODEL = 81
 default_prompt_t2v = "cinematic footage, group of pedestrians dancing in the streets of NYC, high quality breakdance, 4K, tiktok video, intricate details, instagram feel, dynamic camera, smooth dance motion, dimly lit, stylish, beautiful faces, smiling, music video"
 default_negative_prompt = "Bright tones, overexposed, static, blurred details, subtitles, style, works, paintings, images, static, overall gray, worst quality, low quality, JPEG compression residue, ugly, incomplete, extra fingers, poorly drawn hands, poorly drawn faces, deformed, disfigured, misshapen limbs, fused fingers, still picture, messy background, three legs, many people in the background, walking backwards, watermark, text, signature"

 pipe.set_adapters(["causvid_lora"], adapter_weights=[0.95])
 pipe.fuse_lora()
+# MOD_VALUE = 32
+# DEFAULT_H_SLIDER_VALUE =  512
+# DEFAULT_W_SLIDER_VALUE =  896
+# # Environment variable check
+# IS_ORIGINAL_SPACE = os.environ.get("IS_ORIGINAL_SPACE", "True") == "True"
+# # Original limits
+# ORIGINAL_SLIDER_MIN_H, ORIGINAL_SLIDER_MAX_H = 128, 1280
+# ORIGINAL_SLIDER_MIN_W, ORIGINAL_SLIDER_MAX_W = 128, 1280
+# ORIGINAL_MAX_DURATION = round(81/24, 1)  # MAX_FRAMES_MODEL/FIXED_FPS
+# # Limited space constants
+# LIMITED_MAX_RESOLUTION = 640
+# LIMITED_MAX_DURATION = 2.0
+# LIMITED_MAX_STEPS = 4
+# # Set limits based on environment variable
+# if IS_ORIGINAL_SPACE:
+#     SLIDER_MIN_H, SLIDER_MAX_H = 128, LIMITED_MAX_RESOLUTION
+#     SLIDER_MIN_W, SLIDER_MAX_W = 128, LIMITED_MAX_RESOLUTION
+#     MAX_DURATION = LIMITED_MAX_DURATION
+#     MAX_STEPS = LIMITED_MAX_STEPS
+# else:
+#     SLIDER_MIN_H, SLIDER_MAX_H = ORIGINAL_SLIDER_MIN_H, ORIGINAL_SLIDER_MAX_H
+#     SLIDER_MIN_W, SLIDER_MAX_W = ORIGINAL_SLIDER_MIN_W, ORIGINAL_SLIDER_MAX_W
+#     MAX_DURATION = ORIGINAL_MAX_DURATION
+#     MAX_STEPS = 8
+# MAX_SEED = np.iinfo(np.int32).max
+# FIXED_FPS = 24
+# FIXED_OUTPUT_FPS = 18 # we downspeed the output video as a temporary "trick"
+# MIN_FRAMES_MODEL = 8
+# MAX_FRAMES_MODEL = 81
+#New math to make it High Res
 MOD_VALUE = 32
+# Defaults for higher-res generation
+DEFAULT_H_SLIDER_VALUE = 768
+DEFAULT_W_SLIDER_VALUE = 1344  # 16:9 friendly and divisible by MOD_VALUE
+# Original Space = Hugging Face space with compute limits
+IS_ORIGINAL_SPACE = os.environ.get("IS_ORIGINAL_SPACE", "True") == "True"
+# Conservative limits for low-end environments
 LIMITED_MAX_RESOLUTION = 640
 LIMITED_MAX_DURATION = 2.0
 LIMITED_MAX_STEPS = 4
+# Generous limits for local or Pro spaces
+ORIGINAL_SLIDER_MIN_H, ORIGINAL_SLIDER_MAX_H = 128, 1536
+ORIGINAL_SLIDER_MIN_W, ORIGINAL_SLIDER_MAX_W = 128, 1536
+ORIGINAL_MAX_DURATION = round(81 / 24, 1)  # 3.4 seconds
+ORIGINAL_MAX_STEPS = 8
+# Use limited or original (generous) settings
 if IS_ORIGINAL_SPACE:
     SLIDER_MIN_H, SLIDER_MAX_H = 128, LIMITED_MAX_RESOLUTION
     SLIDER_MIN_W, SLIDER_MAX_W = 128, LIMITED_MAX_RESOLUTION
     SLIDER_MIN_H, SLIDER_MAX_H = ORIGINAL_SLIDER_MIN_H, ORIGINAL_SLIDER_MAX_H
     SLIDER_MIN_W, SLIDER_MAX_W = ORIGINAL_SLIDER_MIN_W, ORIGINAL_SLIDER_MAX_W
     MAX_DURATION = ORIGINAL_MAX_DURATION
+    MAX_STEPS = ORIGINAL_MAX_STEPS
 MAX_SEED = np.iinfo(np.int32).max
 FIXED_FPS = 24
+FIXED_OUTPUT_FPS = 18  # reduce final video FPS to save space
 MIN_FRAMES_MODEL = 8
+MAX_FRAMES_MODEL = 81
 default_prompt_t2v = "cinematic footage, group of pedestrians dancing in the streets of NYC, high quality breakdance, 4K, tiktok video, intricate details, instagram feel, dynamic camera, smooth dance motion, dimly lit, stylish, beautiful faces, smiling, music video"
 default_negative_prompt = "Bright tones, overexposed, static, blurred details, subtitles, style, works, paintings, images, static, overall gray, worst quality, low quality, JPEG compression residue, ugly, incomplete, extra fingers, poorly drawn hands, poorly drawn faces, deformed, disfigured, misshapen limbs, fused fingers, still picture, messy background, three legs, many people in the background, walking backwards, watermark, text, signature"