lesso commited on
Commit
472cbbe
·
verified ·
1 Parent(s): 924151b

Training in progress, step 300, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:058530e4eca99670ba0055d082a2a4d9f5f1ec55158c626ecd381ff8c1e3ad4e
3
  size 201892112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17ed18ddb023a3395a41a23181578cfeba8e7519d1310b3a40b04942780145f0
3
  size 201892112
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04a5e427456baf8da92567a0350f1723ab6595d58be597a7b216854a05d2d9f4
3
- size 102864548
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c80c1f04c65f4b069b9b7ca9cb4de410727a589a5ee29e5712e78cdaa8a8d7bc
3
+ size 102864868
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7131b70fc7ebdd91a4fdaf6a201da7ae892386e8abcc9ed2410b4cbcda1633cf
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:827aa64c8faf16952bd9662def653a65b68fa9797cf29fca95f2cd42c5fffb53
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bc544fc67f1b8a2b1db90f19b38ff839ccead6d1b6c5672460d1acb014ba0c1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a987734371c39c6974f0e478c7d6a4ed2064b15a4162308e0d41fa113d63e748
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.10329132527112961,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-150",
4
- "epoch": 1.2654867256637168,
5
  "eval_steps": 50,
6
- "global_step": 250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -90,6 +90,21 @@
90
  "eval_samples_per_second": 176.766,
91
  "eval_steps_per_second": 5.574,
92
  "step": 250
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
93
  }
94
  ],
95
  "logging_steps": 50,
@@ -104,7 +119,7 @@
104
  "early_stopping_threshold": 0.0
105
  },
106
  "attributes": {
107
- "early_stopping_patience_counter": 2
108
  }
109
  },
110
  "TrainerControl": {
@@ -113,12 +128,12 @@
113
  "should_evaluate": false,
114
  "should_log": false,
115
  "should_save": true,
116
- "should_training_stop": false
117
  },
118
  "attributes": {}
119
  }
120
  },
121
- "total_flos": 1.0708402219411046e+17,
122
  "train_batch_size": 32,
123
  "trial_name": null,
124
  "trial_params": null
 
1
  {
2
  "best_metric": 0.10329132527112961,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-150",
4
+ "epoch": 1.5183312262958282,
5
  "eval_steps": 50,
6
+ "global_step": 300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
90
  "eval_samples_per_second": 176.766,
91
  "eval_steps_per_second": 5.574,
92
  "step": 250
93
+ },
94
+ {
95
+ "epoch": 1.5183312262958282,
96
+ "grad_norm": 0.07207214087247849,
97
+ "learning_rate": 0.000203,
98
+ "loss": 0.1043,
99
+ "step": 300
100
+ },
101
+ {
102
+ "epoch": 1.5183312262958282,
103
+ "eval_loss": 0.10684775561094284,
104
+ "eval_runtime": 7.5158,
105
+ "eval_samples_per_second": 177.228,
106
+ "eval_steps_per_second": 5.588,
107
+ "step": 300
108
  }
109
  ],
110
  "logging_steps": 50,
 
119
  "early_stopping_threshold": 0.0
120
  },
121
  "attributes": {
122
+ "early_stopping_patience_counter": 3
123
  }
124
  },
125
  "TrainerControl": {
 
128
  "should_evaluate": false,
129
  "should_log": false,
130
  "should_save": true,
131
+ "should_training_stop": true
132
  },
133
  "attributes": {}
134
  }
135
  },
136
+ "total_flos": 1.2841550071883366e+17,
137
  "train_batch_size": 32,
138
  "trial_name": null,
139
  "trial_params": null