Training in progress, step 50, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d6691c97c2ffe4d42101beaf5dd8eda4772426c736425774069da9f263b82bc1
 size 3558888

 version https://git-lfs.github.com/spec/v1
+oid sha256:f771ec08b58b5db2df1e35e840beea613fd221403cda69960cf10980b637f430
 size 3558888

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ec7ebe01b39eec308e3272194599a058aefb21154deb4a9a287329a00bad5898
 size 7198906

 version https://git-lfs.github.com/spec/v1
+oid sha256:5ba8e1b2a096f1141bc55a687262f697707eec5e5ef262b6683ba51ab8056edb
 size 7198906

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:73a19190b84f0531119dab9b890331fcea2eae794322be8422a5be37c17d74a3
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:04fca484010f00fef17865c6b5cf7f6664a5d9146ff300b3753875bfa60c7f76
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5f34000de8119b9f7164ac0e78cd1e7173e2cfe31e95319137ec32abdf60c7ba
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4ad95690c27927b8374216bcc4afe0bd6bd85edbbc60e77edab073d52865c2e
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.189873417721519,
   "eval_steps": 5,
-  "global_step": 45,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -79,13 +79,21 @@
       "eval_samples_per_second": 19.133,
       "eval_steps_per_second": 2.392,
       "step": 45
     }
   ],
   "logging_steps": 500,
   "max_steps": 237,
   "num_train_epochs": 1,
   "save_steps": 5,
-  "total_flos": 185618320588800.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.2109704641350211,
   "eval_steps": 5,
+  "global_step": 50,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 19.133,
       "eval_steps_per_second": 2.392,
       "step": 45
+    },
+    {
+      "epoch": 0.21,
+      "eval_loss": 15.608057975769043,
+      "eval_runtime": 121.069,
+      "eval_samples_per_second": 19.163,
+      "eval_steps_per_second": 2.395,
+      "step": 50
     }
   ],
   "logging_steps": 500,
   "max_steps": 237,
   "num_train_epochs": 1,
   "save_steps": 5,
+  "total_flos": 206242578432000.0,
   "trial_name": null,
   "trial_params": null
 }