Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -101,7 +101,7 @@ def initialize_model():
 device_map="cuda",
 attn_implementation="flash_attention_2",
 trust_remote_code=True,
-
+quantization_config=quantization_config
 
 )
 