cpt core 4
Browse files
scripts/cpt_core_model_4.py
CHANGED
|
@@ -4,7 +4,7 @@ from transformers import AutoTokenizer
|
|
| 4 |
|
| 5 |
max_seq_length = 16385
|
| 6 |
dtype = torch.bfloat16
|
| 7 |
-
load_in_4bit = True
|
| 8 |
model_name = '../out/pretrain-core-3/hf'
|
| 9 |
output_dir = '../out/cpt-core-4'
|
| 10 |
|
|
|
|
| 4 |
|
| 5 |
max_seq_length = 16385
|
| 6 |
dtype = torch.bfloat16
|
| 7 |
+
load_in_4bit = False
|
| 8 |
model_name = '../out/pretrain-core-3/hf'
|
| 9 |
output_dir = '../out/cpt-core-4'
|
| 10 |
|