qwen2.5-VL-api

Running

danilohssantana committed on Feb 20

Commit

3ab6021

1 Parent(s): 3d2e7b8

adding new model

Files changed (1) hide show

main.py CHANGED Viewed

@@ -35,8 +35,8 @@ class PredictRequest(BaseModel):
 #     device_map="auto",
 #     # attn_implementation="flash_attention_2",
 # )
-checkpoint = "Qwen/Qwen2.5-VL-7B-Instruct"
 min_pixels = 256 * 28 * 28
 max_pixels = 1280 * 28 * 28
 processor = AutoProcessor.from_pretrained(

 #     device_map="auto",
 #     # attn_implementation="flash_attention_2",
 # )
+# checkpoint = "Qwen/Qwen2.5-VL-7B-Instruct"
+checkpoint = "Qwen/Qwen2-VL-72B-Instruct-GPTQ-Int4"
 min_pixels = 256 * 28 * 28
 max_pixels = 1280 * 28 * 28
 processor = AutoProcessor.from_pretrained(