lesso06 commited on
Commit
a988832
·
verified ·
1 Parent(s): 14df2cd

Training in progress, step 350, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f90f29add083e70435ccfcdb9324896e0d661ce675afea96492133329ed27409
3
  size 1157746040
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1da9f0e1748b79b0e2ea094ecc52c3475afb89979699261200296acbbf4c5b0
3
  size 1157746040
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17f29963d218f536f17aa1aea587ddabfad09e50c404853c0317e3fff1876cb9
3
  size 588700500
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adfa8bf05dc665b19a9d27cdfc7aeb1f8e04a1e815cd33dacbdaff1b978c4950
3
  size 588700500
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be935466c588a753f80b4b6fd059919104354d0102b7a2dca4181c83f51ce99e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7211b19267643e4a4695239646f9fc645d8110b1d66e4a8494a1b44822fb5bcd
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf9d37d8ac9041b1174177f2abdfd03da05c909db05db7e02be2b5adefcdb593
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edaf981d1dfb35fd3b5ff50f9b58cbbedb093fe8427ac222964e342dc83dc071
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 1.7082891464233398,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-250",
4
- "epoch": 0.08526360665056132,
5
  "eval_steps": 50,
6
- "global_step": 300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -273,6 +273,49 @@
273
  "eval_samples_per_second": 9.008,
274
  "eval_steps_per_second": 2.261,
275
  "step": 300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
276
  }
277
  ],
278
  "logging_steps": 10,
@@ -287,7 +330,7 @@
287
  "early_stopping_threshold": 0.0
288
  },
289
  "attributes": {
290
- "early_stopping_patience_counter": 1
291
  }
292
  },
293
  "TrainerControl": {
@@ -301,7 +344,7 @@
301
  "attributes": {}
302
  }
303
  },
304
- "total_flos": 5.215556344165171e+16,
305
  "train_batch_size": 2,
306
  "trial_name": null,
307
  "trial_params": null
 
1
  {
2
+ "best_metric": 1.625133752822876,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-350",
4
+ "epoch": 0.0994742077589882,
5
  "eval_steps": 50,
6
+ "global_step": 350,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
273
  "eval_samples_per_second": 9.008,
274
  "eval_steps_per_second": 2.261,
275
  "step": 300
276
+ },
277
+ {
278
+ "epoch": 0.0881057268722467,
279
+ "grad_norm": 1.6801893711090088,
280
+ "learning_rate": 7.808204475323423e-05,
281
+ "loss": 1.097,
282
+ "step": 310
283
+ },
284
+ {
285
+ "epoch": 0.09094784709393207,
286
+ "grad_norm": 1.468928575515747,
287
+ "learning_rate": 7.117124957938042e-05,
288
+ "loss": 1.6221,
289
+ "step": 320
290
+ },
291
+ {
292
+ "epoch": 0.09378996731561745,
293
+ "grad_norm": 2.429023027420044,
294
+ "learning_rate": 6.441552087816105e-05,
295
+ "loss": 1.7242,
296
+ "step": 330
297
+ },
298
+ {
299
+ "epoch": 0.09663208753730283,
300
+ "grad_norm": 2.3508596420288086,
301
+ "learning_rate": 5.784777188072502e-05,
302
+ "loss": 1.5539,
303
+ "step": 340
304
+ },
305
+ {
306
+ "epoch": 0.0994742077589882,
307
+ "grad_norm": 1.75046968460083,
308
+ "learning_rate": 5.150000000000002e-05,
309
+ "loss": 1.8748,
310
+ "step": 350
311
+ },
312
+ {
313
+ "epoch": 0.0994742077589882,
314
+ "eval_loss": 1.625133752822876,
315
+ "eval_runtime": 82.1926,
316
+ "eval_samples_per_second": 9.015,
317
+ "eval_steps_per_second": 2.263,
318
+ "step": 350
319
  }
320
  ],
321
  "logging_steps": 10,
 
330
  "early_stopping_threshold": 0.0
331
  },
332
  "attributes": {
333
+ "early_stopping_patience_counter": 0
334
  }
335
  },
336
  "TrainerControl": {
 
344
  "attributes": {}
345
  }
346
  },
347
+ "total_flos": 6.106822301712384e+16,
348
  "train_batch_size": 2,
349
  "trial_name": null,
350
  "trial_params": null