evgmaslov commited on
Commit
aa7d2a2
·
verified ·
1 Parent(s): 34538db

Training in progress, step 200, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97e403247e108f8661572e48642fcee35333d59756d365dd88e42aa8fa631e01
3
  size 109069176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74cb1b9a17e01550d57f682c2272b3bcf0a1d728f76798a7a32cd2fc0da17666
3
  size 109069176
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a78ccc666d673e12a1d28ba1a0c083d89609fb81d00fe4e836b0adb4a945bd17
3
  size 218182522
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db82133d614c41620cd9d82024c4fa04bf2e666462b7f18d90c603df7f58d315
3
  size 218182522
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ec13f903514339721d4fa36583de00b741de7c3211dcacf6bacb6d18deb801b
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ad52e7945fe9fccdea4f2280e2dc163fe9acbd3e1c3c17e8c8ca07c93e117b3
3
  size 15920
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50f071de52013f68f57295901e5ddc08acc43e109f8cb7dba74f60d0d7748715
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:650fb6d7204c3921156794778517ab758b12af1b15578a6d4066a15364eadb18
3
  size 15920
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cef6d64e63d59ee2eba46b2f0fb6178a55d13fa9afc1aee77233b4e227ad515
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cd00350105ff8d620631953fb7bad049e92b7f8b1d194f2d8b461d9448c9fd9
3
  size 15920
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:355963aa21309380e38afe68229d60ff9b15967107a7ef4c7eab7ebd3ea50e61
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5e3eff2a323c0142563dd3a05e44b71e2aa10e311417bc0135233e704c94d7f
3
  size 15920
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6fedcc7a1d8a5aba26bb77ebd09b6a5407e2df12c52b6dd86a40947cc2f00e7
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:942e183d63fa3202f22fbed87394f5ac3082586d3385de3d8387035dd8d2ed4c
3
  size 15920
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d40d58def6274140f8becda92cf0bc42993ad0baa6ff0c0e293520959b0e50a
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4523f9690e096f422bb89f32ba1ddaf9d455ed4ca615ae687c8f8f6d368018aa
3
  size 15920
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8c72974fa22951100db4aed3d7025edc277b935bd704506d0196e9eee2c07b1
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac839e2f87d1ad1ec27d2da48d8042750d005b15c60b3cd4cce3067920c0f77e
3
  size 15920
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d7a738add2d312885f59497ef6711c979d20522d5f170a22e3ed6a959bf9c0f
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70c519ea38804e0064881be32c12048052b312ec0030222b8613a2d3c3f8bd9c
3
  size 15920
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54097a2547f55954225eced1bc1b37eabe661762014e3a7653069b8596a803c8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9422972de243dbed72656536159e149e3061feb398bc1fce55cbdc45f11de4f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.25,
5
  "eval_steps": 100,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -15,6 +15,14 @@
15
  "eval_samples_per_second": 9.358,
16
  "eval_steps_per_second": 0.292,
17
  "step": 100
 
 
 
 
 
 
 
 
18
  }
19
  ],
20
  "logging_steps": 500,
@@ -34,7 +42,7 @@
34
  "attributes": {}
35
  }
36
  },
37
- "total_flos": 1.4808884027850752e+17,
38
  "train_batch_size": 4,
39
  "trial_name": null,
40
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.5,
5
  "eval_steps": 100,
6
+ "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
15
  "eval_samples_per_second": 9.358,
16
  "eval_steps_per_second": 0.292,
17
  "step": 100
18
+ },
19
+ {
20
+ "epoch": 0.5,
21
+ "eval_loss": 0.018465671688318253,
22
+ "eval_runtime": 3.4208,
23
+ "eval_samples_per_second": 9.355,
24
+ "eval_steps_per_second": 0.292,
25
+ "step": 200
26
  }
27
  ],
28
  "logging_steps": 500,
 
42
  "attributes": {}
43
  }
44
  },
45
+ "total_flos": 2.9617768055701504e+17,
46
  "train_batch_size": 4,
47
  "trial_name": null,
48
  "trial_params": null