cpt core 4
Browse files
scripts/cpt_core_model_4.py
CHANGED
@@ -82,7 +82,7 @@ trainer = UnslothTrainer(
|
|
82 |
max_seq_length=max_seq_length,
|
83 |
dataset_num_proc=32,
|
84 |
max_steps=len(litgpt_streaming_dataset),
|
85 |
-
packing
|
86 |
|
87 |
args = UnslothTrainingArguments(
|
88 |
per_device_train_batch_size=16,
|
|
|
82 |
max_seq_length=max_seq_length,
|
83 |
dataset_num_proc=32,
|
84 |
max_steps=len(litgpt_streaming_dataset),
|
85 |
+
packing=False, # Can make training 5x faster for short sequences.
|
86 |
|
87 |
args = UnslothTrainingArguments(
|
88 |
per_device_train_batch_size=16,
|