Spaces:
Paused
Paused
Update train.py
Browse files
train.py
CHANGED
@@ -27,10 +27,11 @@ SHARD_SIZE = int(2e+5)
|
|
27 |
FP16 = True
|
28 |
WEIGHT_DECAY = 1e-3
|
29 |
GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // 4
|
30 |
-
|
31 |
PUSH_TO_HUB = True
|
32 |
|
33 |
-
total_steps =
|
|
|
34 |
|
35 |
class Space:
|
36 |
def __init__(self):
|
@@ -202,6 +203,7 @@ def train_model(model, tokenizer, dataset, push, isinst):
|
|
202 |
save_steps=WARMUP_STEPS * 5,
|
203 |
logging_steps=WARMUP_STEPS,
|
204 |
eval_strategy="no",
|
|
|
205 |
# eval_steps=WARMUP_STEPS,
|
206 |
save_total_limit=2,
|
207 |
)
|
|
|
27 |
FP16 = True
|
28 |
WEIGHT_DECAY = 1e-3
|
29 |
GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // 4
|
30 |
+
|
31 |
PUSH_TO_HUB = True
|
32 |
|
33 |
+
# Whole number of steps: SHARD_SIZE * EPOCHS floor-divided by
# BATCH_SIZE * GRADIENT_ACCUMULATION_STEPS.
# NOTE(review): presumably the optimizer-step count for one shard; confirm
# that BATCH_SIZE here is the per-step batch size the trainer actually uses.
total_steps = (SHARD_SIZE * EPOCHS) // (BATCH_SIZE * GRADIENT_ACCUMULATION_STEPS)
|
34 |
+
# Warm-up length: about 10% of total_steps, kept as a whole number >= 1.
# This value is also passed as logging_steps and (times 5) as save_steps,
# which must be integral when above 1 and non-zero; a float product such as
# 30 * 0.1 == 3.0000000000000004 would be rejected, so use integer division.
WARMUP_STEPS = max(1, total_steps // 10)
|
35 |
|
36 |
class Space:
|
37 |
def __init__(self):
|
|
|
203 |
save_steps=WARMUP_STEPS * 5,
|
204 |
logging_steps=WARMUP_STEPS,
|
205 |
eval_strategy="no",
|
206 |
+
report_to="no",
|
207 |
# eval_steps=WARMUP_STEPS,
|
208 |
save_total_limit=2,
|
209 |
)
|