lesso10 commited on
Commit
3b5f65b
·
verified ·
1 Parent(s): 47adb3d

Training in progress, step 263, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b84400837bef983cc3abec69ee1a32ef4ca5fdd992aed4368f742208087954f2
3
  size 72936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df9231c70dee7e32ded47caf5663af30dde5230a32544540abb78487c1d4aedd
3
  size 72936
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:478083457920f8c762d943d8406b493cb7eeb8a86abafa26deb6098eb89b9543
3
  size 151106
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eb7bb014eba9a50dc99631309e24993cb53ef6f4400a355740166a50052dfa2
3
  size 151106
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53c6141d9349cbeee031d01ce56ea60718c6e315d601bf731c74a0ca690f5afb
3
  size 14180
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fbc1de8416f86affe82bd96e37b50e56fc74868b9c9b5cdff5ee4416dd4d240
3
  size 14180
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99573f786b471698147a90bca9832c01f3a6051546b34cf62733f3000c01a587
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce50c1db2e1ed1848dbc95405ff8f729fea88553cef218c8a2f3ff7b61aead36
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 12.254945755004883,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-250",
4
- "epoch": 0.9505703422053232,
5
  "eval_steps": 50,
6
- "global_step": 250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -230,6 +230,13 @@
230
  "eval_samples_per_second": 151.566,
231
  "eval_steps_per_second": 38.233,
232
  "step": 250
 
 
 
 
 
 
 
233
  }
234
  ],
235
  "logging_steps": 10,
@@ -253,12 +260,12 @@
253
  "should_evaluate": false,
254
  "should_log": false,
255
  "should_save": true,
256
- "should_training_stop": false
257
  },
258
  "attributes": {}
259
  }
260
  },
261
- "total_flos": 120520704000.0,
262
  "train_batch_size": 4,
263
  "trial_name": null,
264
  "trial_params": null
 
1
  {
2
  "best_metric": 12.254945755004883,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-250",
4
+ "epoch": 1.0,
5
  "eval_steps": 50,
6
+ "global_step": 263,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
230
  "eval_samples_per_second": 151.566,
231
  "eval_steps_per_second": 38.233,
232
  "step": 250
233
+ },
234
+ {
235
+ "epoch": 0.9885931558935361,
236
+ "grad_norm": 0.38638147711753845,
237
+ "learning_rate": 1.0277121540277156e-07,
238
+ "loss": 12.2669,
239
+ "step": 260
240
  }
241
  ],
242
  "logging_steps": 10,
 
260
  "should_evaluate": false,
261
  "should_log": false,
262
  "should_save": true,
263
+ "should_training_stop": true
264
  },
265
  "attributes": {}
266
  }
267
  },
268
+ "total_flos": 126787780608.0,
269
  "train_batch_size": 4,
270
  "trial_name": null,
271
  "trial_params": null