zhengr committed on
Commit
be7d67b
·
verified ·
1 Parent(s): 9777dd4

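Update app.py: load the base model without the access token and 8-bit quantization, and move tokenizer inputs to `model.device` instead of calling `model.device('cuda:0')`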

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -29,7 +29,8 @@ streamer = TextStreamer(tokenizer)
29
 
30
  #model = AutoModelForCausalLM.from_pretrained(model, trust_remote_code=True, token = access_token, device_map="cuda", load_in_8bit=True, offload_folder="offload/")
31
  #model = PeftModel.from_pretrained(model, peft_model, offload_folder="offload/")
32
- model = AutoModelForCausalLM.from_pretrained(model, trust_remote_code=True, token = access_token, device_map="cuda", load_in_8bit=True)
 
33
  model = PeftModel.from_pretrained(model, peft_model)
34
 
35
  model = model.eval()
@@ -398,9 +399,9 @@ def ask(symbol, weeks_before, withbasic):
398
  #model=model.to(device)
399
 
400
  print(model.device)
 
401
  inputs = tokenizer(pt, return_tensors='pt')
402
-
403
- inputs = {key: value.to(model.device('cuda:0')) for key, value in inputs.items()}
404
  #inputs = {key: value.to(model.device) for key, value in inputs.items()}
405
  #inputs = {key: value.to('cuda:0') for key, value in inputs.items()}
406
  print("Inputs loaded onto devices.")
 
29
 
30
  #model = AutoModelForCausalLM.from_pretrained(model, trust_remote_code=True, token = access_token, device_map="cuda", load_in_8bit=True, offload_folder="offload/")
31
  #model = PeftModel.from_pretrained(model, peft_model, offload_folder="offload/")
32
+
33
+ model = AutoModelForCausalLM.from_pretrained(model, trust_remote_code=True, device_map="cuda")
34
  model = PeftModel.from_pretrained(model, peft_model)
35
 
36
  model = model.eval()
 
399
  #model=model.to(device)
400
 
401
  print(model.device)
402
+
403
  inputs = tokenizer(pt, return_tensors='pt')
404
+ inputs = {key: value.to(model.device) for key, value in inputs.items()}
 
405
  #inputs = {key: value.to(model.device) for key, value in inputs.items()}
406
  #inputs = {key: value.to('cuda:0') for key, value in inputs.items()}
407
  print("Inputs loaded onto devices.")