Update app.py
Browse files
app.py
CHANGED
@@ -114,13 +114,13 @@ trainer = SFTTrainer(
|
|
114 |
packing=False,
|
115 |
args=TrainingArguments(
|
116 |
per_device_train_batch_size=1,
|
117 |
-
gradient_accumulation_steps=
|
118 |
learning_rate=2e-4,
|
119 |
fp16=not is_bfloat16_supported(),
|
120 |
bf16=is_bfloat16_supported(),
|
121 |
warmup_steps=5,
|
122 |
logging_steps=10,
|
123 |
-
max_steps=
|
124 |
optim="adamw_8bit",
|
125 |
weight_decay=0.01,
|
126 |
lr_scheduler_type="linear",
|
|
|
114 |
packing=False,
|
115 |
args=TrainingArguments(
|
116 |
per_device_train_batch_size=1,
|
117 |
+
gradient_accumulation_steps=1,
|
118 |
learning_rate=2e-4,
|
119 |
fp16=not is_bfloat16_supported(),
|
120 |
bf16=is_bfloat16_supported(),
|
121 |
warmup_steps=5,
|
122 |
logging_steps=10,
|
123 |
+
max_steps=100,
|
124 |
optim="adamw_8bit",
|
125 |
weight_decay=0.01,
|
126 |
lr_scheduler_type="linear",
|