Daemontatox committed on
Commit
a93bc12
·
verified ·
1 Parent(s): 05fbf52

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -34,10 +34,10 @@ h3 {
34
  device = "cuda" # for GPU usage or "cpu" for CPU usage
35
 
36
  quantization_config = BitsAndBytesConfig(
37
- load_in_8bit=True,
38
- bnb_8bit_compute_dtype=torch.bfloat16,
39
- bnb_8bit_use_double_quant=True,
40
- bnb_8bit_quant_type= "nf4")
41
 
42
  tokenizer = AutoTokenizer.from_pretrained(MODEL)
43
  model = AutoModelForCausalLM.from_pretrained(
 
34
  device = "cuda" # for GPU usage or "cpu" for CPU usage
35
 
36
  quantization_config = BitsAndBytesConfig(
37
+ load_in_4bit=True,
38
+ bnb_4bit_compute_dtype=torch.bfloat16,
39
+ bnb_4bit_use_double_quant=True,
40
+ bnb_4bit_quant_type= "nf4")
41
 
42
  tokenizer = AutoTokenizer.from_pretrained(MODEL)
43
  model = AutoModelForCausalLM.from_pretrained(