Update handler.py
Browse files — handler.py (+7, −2)
handler.py
CHANGED
@@ -7,6 +7,7 @@ import random
|
|
7 |
import traceback
|
8 |
import torch
|
9 |
import os
|
|
|
10 |
|
11 |
# note: there is no HunyuanImageToVideoPipeline yet in Diffusers
|
12 |
from diffusers import HunyuanVideoPipeline, HunyuanVideoTransformer3DModel, FasterCacheConfig
|
@@ -276,7 +277,7 @@ class EndpointHandler:
|
|
276 |
#else:
|
277 |
# disable_teacache(self.pipeline.transformer)
|
278 |
|
279 |
-
with torch.inference_mode():
|
280 |
|
281 |
# Prepare generation parameters
|
282 |
generation_kwargs = {
|
@@ -360,7 +361,11 @@ class EndpointHandler:
|
|
360 |
asyncio.set_event_loop(loop)
|
361 |
|
362 |
video_uri, metadata = loop.run_until_complete(self.process_frames(frames, config))
|
363 |
-
|
|
|
|
|
|
|
|
|
364 |
return {
|
365 |
"video": video_uri,
|
366 |
"content-type": "video/mp4",
|
|
|
7 |
import traceback
|
8 |
import torch
|
9 |
import os
|
10 |
+
import gc
|
11 |
|
12 |
# note: there is no HunyuanImageToVideoPipeline yet in Diffusers
|
13 |
from diffusers import HunyuanVideoPipeline, HunyuanVideoTransformer3DModel, FasterCacheConfig
|
|
|
277 |
#else:
|
278 |
# disable_teacache(self.pipeline.transformer)
|
279 |
|
280 |
+
with torch.amp.autocast_mode.autocast('cuda', torch.bfloat16), torch.no_grad(), torch.inference_mode():
|
281 |
|
282 |
# Prepare generation parameters
|
283 |
generation_kwargs = {
|
|
|
361 |
asyncio.set_event_loop(loop)
|
362 |
|
363 |
video_uri, metadata = loop.run_until_complete(self.process_frames(frames, config))
|
364 |
+
|
365 |
+
torch.cuda.empty_cache()
|
366 |
+
torch.cuda.reset_peak_memory_stats()
|
367 |
+
gc.collect()
|
368 |
+
|
369 |
return {
|
370 |
"video": video_uri,
|
371 |
"content-type": "video/mp4",
|