Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -112,7 +112,7 @@ def initialize_model():
|
|
112 |
torch_dtype=torch.float16,
|
113 |
device_map="auto",
|
114 |
attn_implementation="flash_attention_2",
|
115 |
-
quantization_config=quantization_config
|
116 |
)
|
117 |
|
118 |
return model, tokenizer
|
|
|
112 |
torch_dtype=torch.float16,
|
113 |
device_map="auto",
|
114 |
attn_implementation="flash_attention_2",
|
115 |
+
# quantization_config=quantization_config
|
116 |
)
|
117 |
|
118 |
return model, tokenizer
|