nroggendorff committed on
Commit
ae4cbda
·
verified ·
1 Parent(s): 37138f9

Update train.py

Browse files
Files changed (1) hide show
  1. train.py +4 -2
train.py CHANGED
@@ -27,10 +27,11 @@ SHARD_SIZE = int(2e+5)
27
  FP16 = True
28
  WEIGHT_DECAY = 1e-3
29
  GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // 4
30
- WARMUP_STEPS = ((SHARD_SIZE // (BATCH_SIZE * GRADIENT_ACCUMULATION_STEPS)) * EPOCHS) // 10
31
  PUSH_TO_HUB = True
32
 
33
- total_steps = WARMUP_STEPS * 10
 
34
 
35
  class Space:
36
  def __init__(self):
@@ -202,6 +203,7 @@ def train_model(model, tokenizer, dataset, push, isinst):
202
  save_steps=WARMUP_STEPS * 5,
203
  logging_steps=WARMUP_STEPS,
204
  eval_strategy="no",
 
205
  # eval_steps=WARMUP_STEPS,
206
  save_total_limit=2,
207
  )
 
27
  FP16 = True
28
  WEIGHT_DECAY = 1e-3
29
  GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // 4
30
+
31
  PUSH_TO_HUB = True
32
 
33
+ total_steps = (SHARD_SIZE * EPOCHS) // (BATCH_SIZE * GRADIENT_ACCUMULATION_STEPS)
34
+ WARMUP_STEPS = total_steps * 0.1
35
 
36
  class Space:
37
  def __init__(self):
 
203
  save_steps=WARMUP_STEPS * 5,
204
  logging_steps=WARMUP_STEPS,
205
  eval_strategy="no",
206
+ report_to="no",
207
  # eval_steps=WARMUP_STEPS,
208
  save_total_limit=2,
209
  )