ruslanmv committed on
Commit
b6e8fb0
·
1 Parent(s): cc16819

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -35,9 +35,10 @@ print(f"Low memory: {LOW_MEMORY}")
35
 
36
  # Quantization configuration for efficient model loading
37
  # Define BitsAndBytesConfig
38
- quantization_config = BitsAndBytesConfig(load_in_4bit=True,
39
- bnb_4bit_quant_type="nf4",
40
- bnb_4bit_compute_dtype=torch.float16)
 
41
 
42
 
43
  # Load models only once
 
35
 
36
  # Quantization configuration for efficient model loading
37
  # Define BitsAndBytesConfig
38
+ quantization_config = BitsAndBytesConfig(
39
+ load_in_4bit=True,
40
+ bnb_4bit_compute_dtype=torch.float16
41
+ )
42
 
43
 
44
  # Load models only once