Commit
·
a3742d0
1
Parent(s):
9b99c45
update
Browse files
deepseek_vl2/serve/inference.py
CHANGED
@@ -39,7 +39,7 @@ def load_model(model_path, dtype=torch.bfloat16):
|
|
39 |
tokenizer = vl_chat_processor.tokenizer
|
40 |
|
41 |
vl_gpt: DeepseekVLV2ForCausalLM = AutoModelForCausalLM.from_pretrained(
|
42 |
-
model_path, trust_remote_code=True, torch_dtype=dtype
|
43 |
)
|
44 |
if torch.cuda.is_available():
|
45 |
vl_gpt = vl_gpt.cuda()
|
|
|
39 |
tokenizer = vl_chat_processor.tokenizer
|
40 |
|
41 |
vl_gpt: DeepseekVLV2ForCausalLM = AutoModelForCausalLM.from_pretrained(
|
42 |
+
model_path, force_download=False, trust_remote_code=True, torch_dtype=dtype
|
43 |
)
|
44 |
if torch.cuda.is_available():
|
45 |
vl_gpt = vl_gpt.cuda()
|