Spaces:
Running
on
Zero
Running
on
Zero
zR
committed on
Commit
·
5cecc58
1
Parent(s):
85c524d
cuda
Browse files
app.py
CHANGED
@@ -38,6 +38,7 @@ model = AutoModelForCausalLM.from_pretrained(
|
|
38 |
model_name,
|
39 |
torch_dtype=torch.bfloat16,
|
40 |
trust_remote_code=True,
|
|
|
41 |
attn_implementation="flash_attention_2",
|
42 |
)
|
43 |
|
|
|
38 |
model_name,
|
39 |
torch_dtype=torch.bfloat16,
|
40 |
trust_remote_code=True,
|
41 |
+
device="cuda",
|
42 |
attn_implementation="flash_attention_2",
|
43 |
)
|
44 |
|