fff01

Paused

doubility123 committed on Feb 5

Commit

a3742d0

1 Parent(s): 9b99c45

update

Files changed (1) hide show

deepseek_vl2/serve/inference.py CHANGED Viewed

@@ -39,7 +39,7 @@ def load_model(model_path, dtype=torch.bfloat16):
     tokenizer = vl_chat_processor.tokenizer
     vl_gpt: DeepseekVLV2ForCausalLM = AutoModelForCausalLM.from_pretrained(
-        model_path, trust_remote_code=True, torch_dtype=dtype
     )
     if torch.cuda.is_available():
         vl_gpt = vl_gpt.cuda()

     tokenizer = vl_chat_processor.tokenizer
     vl_gpt: DeepseekVLV2ForCausalLM = AutoModelForCausalLM.from_pretrained(
+        model_path, force_download=False, trust_remote_code=True, torch_dtype=dtype
     )
     if torch.cuda.is_available():
         vl_gpt = vl_gpt.cuda()