SystemAdmin123 committed on
Commit
9f2b016
·
verified ·
1 Parent(s): d83a698

Training in progress, step 20, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25a257c5b2e34eda80e3d84f1a8cc4247ba163d63b057609915a20d5c03487fe
3
  size 2066752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5acd54546310927e397d2601dbfa4802a3e8dcaae83fca1cf6eb8d637b7a3718
3
  size 2066752
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1633f2b7e8962c026ec42e81ab43f9714d71927f4f946adc9ea9df77d428a7dd
3
  size 2162798
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b33c209a866661ee58b3141afc7148cd60ff320391c20638f94e38521197299
3
  size 2162798
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4651e32e118f1ea1a8e26dfbbe64298593e12e6a71bcd36cb77f04f86d3f86d
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02bd6697dd0ac01f79967d93e880e93c5ad7e5d6a672668dd596f9f42c435066
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0c1eba909fbb51daca773a25c075f182b4096aff21c9b4ff19dbada2080ac99
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1946c0d35865c02655624537450071d8e3a581f1d24f3c539357cae293b3d2d2
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28adb9f06e220aefdc723ea4380a84d42b8bfb87cc53ce65859d55ce1876f51c
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9faf933c304288a566e09316737d2bdccb42e76da4138d98110982bcbf5dbf1
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:423c49ed521f6986d20d8b29112b383f4b0f3f2e228084ef82c2ad7dcd5d1de8
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f2cb6de5c0f2b78c1515e90a9ab03144587d336dd27fc87023f09785c5d64cb
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a60c7d771c1fd156acee762fba03c724cb41829a3f71df370ecd1d20b134982
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84f22729b765b6841bd185712dd3ab8bf338866cd8396b5dce62f9950913691a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 16.666666666666668,
5
- "eval_steps": 200,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -11,9 +11,9 @@
11
  {
12
  "epoch": 0.16666666666666666,
13
  "eval_loss": 10.376375198364258,
14
- "eval_runtime": 2.361,
15
- "eval_samples_per_second": 635.755,
16
- "eval_steps_per_second": 5.083,
17
  "step": 1
18
  },
19
  {
@@ -31,67 +31,19 @@
31
  "step": 20
32
  },
33
  {
34
- "epoch": 5.0,
35
- "grad_norm": 0.2236328125,
36
- "learning_rate": 0.00016772815716257412,
37
- "loss": 10.3433,
38
- "step": 30
39
- },
40
- {
41
- "epoch": 6.666666666666667,
42
- "grad_norm": 0.3203125,
43
- "learning_rate": 0.00014016954246529696,
44
- "loss": 10.3073,
45
- "step": 40
46
- },
47
- {
48
- "epoch": 8.333333333333334,
49
- "grad_norm": 0.330078125,
50
- "learning_rate": 0.00010825793454723325,
51
- "loss": 10.2602,
52
- "step": 50
53
- },
54
- {
55
- "epoch": 10.0,
56
- "grad_norm": 0.326171875,
57
- "learning_rate": 7.54514512859201e-05,
58
- "loss": 10.2203,
59
- "step": 60
60
- },
61
- {
62
- "epoch": 11.666666666666666,
63
- "grad_norm": 0.326171875,
64
- "learning_rate": 4.530518418775733e-05,
65
- "loss": 10.1945,
66
- "step": 70
67
- },
68
- {
69
- "epoch": 13.333333333333334,
70
- "grad_norm": 0.328125,
71
- "learning_rate": 2.1085949060360654e-05,
72
- "loss": 10.1812,
73
- "step": 80
74
- },
75
- {
76
- "epoch": 15.0,
77
- "grad_norm": 0.328125,
78
- "learning_rate": 5.418275829936537e-06,
79
- "loss": 10.1773,
80
- "step": 90
81
- },
82
- {
83
- "epoch": 16.666666666666668,
84
- "grad_norm": 0.328125,
85
- "learning_rate": 0.0,
86
- "loss": 10.1767,
87
- "step": 100
88
  }
89
  ],
90
  "logging_steps": 10,
91
  "max_steps": 100,
92
  "num_input_tokens_seen": 0,
93
  "num_train_epochs": 17,
94
- "save_steps": 200,
95
  "stateful_callbacks": {
96
  "TrainerControl": {
97
  "args": {
@@ -99,12 +51,12 @@
99
  "should_evaluate": false,
100
  "should_log": false,
101
  "should_save": true,
102
- "should_training_stop": true
103
  },
104
  "attributes": {}
105
  }
106
  },
107
- "total_flos": 81831709900800.0,
108
  "train_batch_size": 32,
109
  "trial_name": null,
110
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.3333333333333335,
5
+ "eval_steps": 20,
6
+ "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
11
  {
12
  "epoch": 0.16666666666666666,
13
  "eval_loss": 10.376375198364258,
14
+ "eval_runtime": 2.4239,
15
+ "eval_samples_per_second": 619.257,
16
+ "eval_steps_per_second": 4.951,
17
  "step": 1
18
  },
19
  {
 
31
  "step": 20
32
  },
33
  {
34
+ "epoch": 3.3333333333333335,
35
+ "eval_loss": 10.353797912597656,
36
+ "eval_runtime": 2.3252,
37
+ "eval_samples_per_second": 645.523,
38
+ "eval_steps_per_second": 5.161,
39
+ "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  }
41
  ],
42
  "logging_steps": 10,
43
  "max_steps": 100,
44
  "num_input_tokens_seen": 0,
45
  "num_train_epochs": 17,
46
+ "save_steps": 20,
47
  "stateful_callbacks": {
48
  "TrainerControl": {
49
  "args": {
 
51
  "should_evaluate": false,
52
  "should_log": false,
53
  "should_save": true,
54
+ "should_training_stop": false
55
  },
56
  "attributes": {}
57
  }
58
  },
59
+ "total_flos": 16366341980160.0,
60
  "train_batch_size": 32,
61
  "trial_name": null,
62
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:177153b8e669200606260ec62fe7b0361ef90146a1e5f2d49d0dff2a631eb3c0
3
  size 6904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d3b61fe0c0e98b749a00886c559e77a474e82e543f32a1ea385827052eed1fc
3
  size 6904