robinhad committed on
Commit
3f1088f
·
verified ·
1 Parent(s): a028ca0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -3
app.py CHANGED
@@ -23,11 +23,10 @@ quant_config = BitsAndBytesConfig(
23
  tokenizer = LlamaTokenizer.from_pretrained(model_name)
24
  model = LlamaForCausalLM.from_pretrained(
25
  model_name,
26
- device_map="cpu"
27
- #quantization_config=quant_config
28
  )
29
 
30
- model = PeftModel.from_pretrained(model, lora_name, hf_device_map="cpu")
31
 
32
  model = model.to("cuda")
33
 
 
23
  tokenizer = LlamaTokenizer.from_pretrained(model_name)
24
  model = LlamaForCausalLM.from_pretrained(
25
  model_name,
26
+ quantization_config=quant_config
 
27
  )
28
 
29
+ model = PeftModel.from_pretrained(model, lora_name, torch_device="cpu")
30
 
31
  model = model.to("cuda")
32