OP7 committed on
Commit
b09dd05
·
verified ·
1 Parent(s): 91d6fed

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -10
app.py CHANGED
@@ -30,20 +30,18 @@ import gradio as gr
30
  from PIL import Image
31
  import torch
32
 
33
-
34
-
35
- # # Create a configuration for quantization
36
- # quantization_config = BitsAndBytesConfig(
37
- # load_in_4bit=True,
38
- # bnb_4bit_compute_dtype="float16",
39
- # bnb_4bit_use_double_quant=True,
40
- # bnb_4bit_quant_type="nf4",
41
- # )
42
 
43
  # Load the model and processor
44
  model = Qwen2VLForConditionalGeneration.from_pretrained(
45
  "Qwen/QVQ-72B-Preview", device_map="auto",
46
- # quantization_config=quantization_config,
47
  offload_folder="offload",
48
  )
49
  processor = AutoProcessor.from_pretrained("Qwen/QVQ-72B-Preview")
 
30
  from PIL import Image
31
  import torch
32
 
33
+ # Create a configuration for quantization
34
+ quantization_config = BitsAndBytesConfig(
35
+ load_in_8bit=True,
36
+ bnb_8bit_compute_dtype="float16",
37
+ bnb_8bit_use_double_quant=True,
38
+ bnb_8bit_quant_type="nf4",
39
+ )
 
 
40
 
41
  # Load the model and processor
42
  model = Qwen2VLForConditionalGeneration.from_pretrained(
43
  "Qwen/QVQ-72B-Preview", device_map="auto",
44
+ quantization_config=quantization_config,
45
  offload_folder="offload",
46
  )
47
  processor = AutoProcessor.from_pretrained("Qwen/QVQ-72B-Preview")