Training in progress, step 200, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:97e403247e108f8661572e48642fcee35333d59756d365dd88e42aa8fa631e01
 size 109069176

 version https://git-lfs.github.com/spec/v1
+oid sha256:74cb1b9a17e01550d57f682c2272b3bcf0a1d728f76798a7a32cd2fc0da17666
 size 109069176

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a78ccc666d673e12a1d28ba1a0c083d89609fb81d00fe4e836b0adb4a945bd17
 size 218182522

 version https://git-lfs.github.com/spec/v1
+oid sha256:db82133d614c41620cd9d82024c4fa04bf2e666462b7f18d90c603df7f58d315
 size 218182522

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ec13f903514339721d4fa36583de00b741de7c3211dcacf6bacb6d18deb801b
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ad52e7945fe9fccdea4f2280e2dc163fe9acbd3e1c3c17e8c8ca07c93e117b3
 size 15920

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:50f071de52013f68f57295901e5ddc08acc43e109f8cb7dba74f60d0d7748715
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:650fb6d7204c3921156794778517ab758b12af1b15578a6d4066a15364eadb18
 size 15920

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2cef6d64e63d59ee2eba46b2f0fb6178a55d13fa9afc1aee77233b4e227ad515
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:0cd00350105ff8d620631953fb7bad049e92b7f8b1d194f2d8b461d9448c9fd9
 size 15920

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:355963aa21309380e38afe68229d60ff9b15967107a7ef4c7eab7ebd3ea50e61
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:f5e3eff2a323c0142563dd3a05e44b71e2aa10e311417bc0135233e704c94d7f
 size 15920

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b6fedcc7a1d8a5aba26bb77ebd09b6a5407e2df12c52b6dd86a40947cc2f00e7
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:942e183d63fa3202f22fbed87394f5ac3082586d3385de3d8387035dd8d2ed4c
 size 15920

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5d40d58def6274140f8becda92cf0bc42993ad0baa6ff0c0e293520959b0e50a
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:4523f9690e096f422bb89f32ba1ddaf9d455ed4ca615ae687c8f8f6d368018aa
 size 15920

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c8c72974fa22951100db4aed3d7025edc277b935bd704506d0196e9eee2c07b1
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:ac839e2f87d1ad1ec27d2da48d8042750d005b15c60b3cd4cce3067920c0f77e
 size 15920

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3d7a738add2d312885f59497ef6711c979d20522d5f170a22e3ed6a959bf9c0f
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:70c519ea38804e0064881be32c12048052b312ec0030222b8613a2d3c3f8bd9c
 size 15920

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:54097a2547f55954225eced1bc1b37eabe661762014e3a7653069b8596a803c8
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:b9422972de243dbed72656536159e149e3061feb398bc1fce55cbdc45f11de4f
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.25,
   "eval_steps": 100,
-  "global_step": 100,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -15,6 +15,14 @@
       "eval_samples_per_second": 9.358,
       "eval_steps_per_second": 0.292,
       "step": 100
     }
   ],
   "logging_steps": 500,
@@ -34,7 +42,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1.4808884027850752e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.5,
   "eval_steps": 100,
+  "global_step": 200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 9.358,
       "eval_steps_per_second": 0.292,
       "step": 100
+    },
+    {
+      "epoch": 0.5,
+      "eval_loss": 0.018465671688318253,
+      "eval_runtime": 3.4208,
+      "eval_samples_per_second": 9.355,
+      "eval_steps_per_second": 0.292,
+      "step": 200
     }
   ],
   "logging_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 2.9617768055701504e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null