Spaces:

slabstech
/

dhwani-internal-api-server

Paused

sachin committed 18 days ago

Commit

7222675

1 Parent(s): 453f545

Add torch.compile

Files changed (1) hide show

src/server/main.py CHANGED Viewed

@@ -386,6 +386,9 @@ class TranslateManager:
             torch_dtype=torch.float16,
             attn_implementation="flash_attention_2"
         ).to(self.device_type)
         return tokenizer, model
 class ModelManager:

             torch_dtype=torch.float16,
             attn_implementation="flash_attention_2"
         ).to(self.device_type)
+        model = torch.compile(model, mode="reduce-overhead")
+        print("Model compiled with torch.compile")
         return tokenizer, model
 class ModelManager: