zR committed on
Commit
5cecc58
·
1 Parent(s): 85c524d
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -38,6 +38,7 @@ model = AutoModelForCausalLM.from_pretrained(
38
  model_name,
39
  torch_dtype=torch.bfloat16,
40
  trust_remote_code=True,
 
41
  attn_implementation="flash_attention_2",
42
  )
43
 
 
38
  model_name,
39
  torch_dtype=torch.bfloat16,
40
  trust_remote_code=True,
41
+ device="cuda",
42
  attn_implementation="flash_attention_2",
43
  )
44