tarabukinivan commited on
Commit
fe1b16b
·
verified ·
1 Parent(s): d356834

Training in progress, step 37, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4aa5a47573be3416e99e5731f9e9edfea50b7c0c3c07dfc651500dbecf7ea258
3
  size 80792096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3d960105c0000a1c5419b399739a6ddfe9ea2fb39ce96f094246cc053509265
3
  size 80792096
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d12803c8d2c4edb9109716fd818ec49d8d1acfb94ecb586870aaca607b5b4e34
3
  size 161810282
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b71eb4dabeb1309f4cb0150d70e1b74002a15cf3bfba976d3d02aa236adf2864
3
  size 161810282
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41c61cee4798669841c3c630b2c76576f4cd8b9a6de6d1faf68fb6f76158011c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0996d79bee52ccc33c437c59c27c1b0a298f5e87d30c2a5c45de8080d570a2cc
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24f70974ebe6e16031ce63527ce3fea95f8e56e83073513783f6d8a14f9aa0e8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:403a4035e63034a6e33503614432aa83d524d5b8ffac47cac18a35f9606be4b7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.035285469247733396,
5
  "eval_steps": 5,
6
- "global_step": 36,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -169,12 +169,12 @@
169
  "should_evaluate": false,
170
  "should_log": false,
171
  "should_save": true,
172
- "should_training_stop": false
173
  },
174
  "attributes": {}
175
  }
176
  },
177
- "total_flos": 1.2546979531849728e+16,
178
  "train_batch_size": 2,
179
  "trial_name": null,
180
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.03626562117128155,
5
  "eval_steps": 5,
6
+ "global_step": 37,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
169
  "should_evaluate": false,
170
  "should_log": false,
171
  "should_save": true,
172
+ "should_training_stop": true
173
  },
174
  "attributes": {}
175
  }
176
  },
177
+ "total_flos": 1.2895506741067776e+16,
178
  "train_batch_size": 2,
179
  "trial_name": null,
180
  "trial_params": null