cpt core 4
Browse files
scripts/cpt_core_model_4.py
CHANGED
@@ -4,7 +4,7 @@ from transformers import AutoTokenizer
|
|
4 |
|
5 |
max_seq_length = 16385
|
6 |
dtype = torch.bfloat16
|
7 |
-
load_in_4bit =
|
8 |
model_name = '../out/pretrain-core-3/hf'
|
9 |
output_dir = '../out/cpt-core-4'
|
10 |
|
|
|
4 |
|
5 |
max_seq_length = 16385
|
6 |
dtype = torch.bfloat16
|
7 |
+
load_in_4bit = False
|
8 |
model_name = '../out/pretrain-core-3/hf'
|
9 |
output_dir = '../out/cpt-core-4'
|
10 |
|