Update handler.py
handler.py  CHANGED  +15 -0
@@ -154,6 +154,13 @@ class EndpointHandler:
 
             #apply_teacache(self.image_to_video)
 
+            # Compilation requires some time to complete, so it is best suited for
+            # situations where you prepare your pipeline once and then perform the
+            # same type of inference operations multiple times.
+            # For example, calling the compiled pipeline on a different image size
+            # triggers compilation again which can be expensive.
+            self.image_to_video.unet = torch.compile(self.image_to_video.unet, mode="reduce-overhead", fullgraph=True)
+
         else:
             # Initialize models with bfloat16 precision
             self.text_to_video = LTXPipeline.from_pretrained(
@@ -163,6 +170,14 @@ class EndpointHandler:
 
             #apply_teacache(self.text_to_video)
 
+            # Compilation requires some time to complete, so it is best suited for
+            # situations where you prepare your pipeline once and then perform the
+            # same type of inference operations multiple times.
+            # For example, calling the compiled pipeline on a different image size
+            # triggers compilation again which can be expensive.
+            self.text_to_video.unet = torch.compile(self.text_to_video.unet, mode="reduce-overhead", fullgraph=True)
+
+
         # Initialize LoRA tracking
         self._current_lora_model = None
 
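For context on what the added torch.compile calls imply in practice: the first call through each compiled module pays the compilation cost, so a throwaway warm-up generation at startup, run at the same resolution the endpoint will serve, keeps that cost off the first real request. The sketch below is illustrative and not part of the commit; the handler instance, prompt, and dimension values are assumptions, and the keyword arguments are the standard diffusers pipeline call parameters.

import torch

def warm_up(handler, height=512, width=768, num_frames=65):
    """Illustrative warm-up sketch: trigger compilation once at the serving resolution.

    Any later call with a different height/width/num_frames would trigger
    recompilation, which is the expensive case the diff's comments warn about.
    """
    with torch.inference_mode():
        handler.text_to_video(
            prompt="warm-up",       # throwaway prompt; the output is discarded
            height=height,
            width=width,
            num_frames=num_frames,
            num_inference_steps=1,  # a single step is usually enough to trigger compilation
        )

The compiled image_to_video pipeline would need an equivalent warm-up call with a dummy input image. If the endpoint must accept varying resolutions, passing dynamic=True to torch.compile trades some of the speed-up for fewer recompilations when input shapes change.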