mmekias committed on
Commit
4fb1a15
·
1 Parent(s): 7c15f94

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.9774436090225563,
4
+ "eval_loss": 0.19460569322109222,
5
+ "eval_runtime": 1.8724,
6
+ "eval_samples_per_second": 71.033,
7
+ "eval_steps_per_second": 2.67,
8
+ "train_loss": 0.42934251626332604,
9
+ "train_runtime": 152.2911,
10
+ "train_samples_per_second": 33.948,
11
+ "train_steps_per_second": 1.083
12
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.9774436090225563,
4
+ "eval_loss": 0.19460569322109222,
5
+ "eval_runtime": 1.8724,
6
+ "eval_samples_per_second": 71.033,
7
+ "eval_steps_per_second": 2.67
8
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aecd07b47a43187477f9b407652dd7dfd2e8507e66deeddba12c8c0e330aadbd
3
  size 343282929
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b89bcab8922707bd9cfbd2809ed22b14726d6f6340068e1e93b5183eac083edb
3
  size 343282929
runs/Nov26_15-40-57_gpu-05/events.out.tfevents.1637926907.gpu-05.1035007.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0834cc80bd1861f1ec883bc138e3e87aa9e270101f5e8eddafb1a94457ea9384
3
- size 6541
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0521af50fbbdf8bb6b5ef5ffae7ebbeb1ddbf23f1fc894d0bcde6022ea8027da
3
+ size 7689
runs/Nov26_15-40-57_gpu-05/events.out.tfevents.1637927062.gpu-05.1035007.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40d357a0e68aed1e7925256e54cb2b806c8652c90993efa9d5b9767b6c1969a4
3
+ size 363
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "train_loss": 0.42934251626332604,
4
+ "train_runtime": 152.2911,
5
+ "train_samples_per_second": 33.948,
6
+ "train_steps_per_second": 1.083
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,166 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.19460569322109222,
3
+ "best_model_checkpoint": "./beans_outputs/checkpoint-165",
4
+ "epoch": 5.0,
5
+ "global_step": 165,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.3,
12
+ "learning_rate": 1.8787878787878792e-05,
13
+ "loss": 1.0301,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.61,
18
+ "learning_rate": 1.7575757575757576e-05,
19
+ "loss": 0.8837,
20
+ "step": 20
21
+ },
22
+ {
23
+ "epoch": 0.91,
24
+ "learning_rate": 1.6363636363636366e-05,
25
+ "loss": 0.7436,
26
+ "step": 30
27
+ },
28
+ {
29
+ "epoch": 1.0,
30
+ "eval_accuracy": 0.9774436090225563,
31
+ "eval_loss": 0.6124519109725952,
32
+ "eval_runtime": 1.9453,
33
+ "eval_samples_per_second": 68.371,
34
+ "eval_steps_per_second": 2.57,
35
+ "step": 33
36
+ },
37
+ {
38
+ "epoch": 1.21,
39
+ "learning_rate": 1.5151515151515153e-05,
40
+ "loss": 0.611,
41
+ "step": 40
42
+ },
43
+ {
44
+ "epoch": 1.52,
45
+ "learning_rate": 1.3939393939393942e-05,
46
+ "loss": 0.516,
47
+ "step": 50
48
+ },
49
+ {
50
+ "epoch": 1.82,
51
+ "learning_rate": 1.2727272727272728e-05,
52
+ "loss": 0.4365,
53
+ "step": 60
54
+ },
55
+ {
56
+ "epoch": 2.0,
57
+ "eval_accuracy": 0.9774436090225563,
58
+ "eval_loss": 0.34239351749420166,
59
+ "eval_runtime": 1.9228,
60
+ "eval_samples_per_second": 69.17,
61
+ "eval_steps_per_second": 2.6,
62
+ "step": 66
63
+ },
64
+ {
65
+ "epoch": 2.12,
66
+ "learning_rate": 1.1515151515151517e-05,
67
+ "loss": 0.4036,
68
+ "step": 70
69
+ },
70
+ {
71
+ "epoch": 2.42,
72
+ "learning_rate": 1.0303030303030304e-05,
73
+ "loss": 0.3354,
74
+ "step": 80
75
+ },
76
+ {
77
+ "epoch": 2.73,
78
+ "learning_rate": 9.090909090909091e-06,
79
+ "loss": 0.3164,
80
+ "step": 90
81
+ },
82
+ {
83
+ "epoch": 3.0,
84
+ "eval_accuracy": 0.9849624060150376,
85
+ "eval_loss": 0.23850761353969574,
86
+ "eval_runtime": 1.9166,
87
+ "eval_samples_per_second": 69.394,
88
+ "eval_steps_per_second": 2.609,
89
+ "step": 99
90
+ },
91
+ {
92
+ "epoch": 3.03,
93
+ "learning_rate": 7.87878787878788e-06,
94
+ "loss": 0.3057,
95
+ "step": 100
96
+ },
97
+ {
98
+ "epoch": 3.33,
99
+ "learning_rate": 6.666666666666667e-06,
100
+ "loss": 0.2561,
101
+ "step": 110
102
+ },
103
+ {
104
+ "epoch": 3.64,
105
+ "learning_rate": 5.4545454545454545e-06,
106
+ "loss": 0.2487,
107
+ "step": 120
108
+ },
109
+ {
110
+ "epoch": 3.94,
111
+ "learning_rate": 4.242424242424243e-06,
112
+ "loss": 0.2347,
113
+ "step": 130
114
+ },
115
+ {
116
+ "epoch": 4.0,
117
+ "eval_accuracy": 0.9774436090225563,
118
+ "eval_loss": 0.1993345469236374,
119
+ "eval_runtime": 1.9018,
120
+ "eval_samples_per_second": 69.932,
121
+ "eval_steps_per_second": 2.629,
122
+ "step": 132
123
+ },
124
+ {
125
+ "epoch": 4.24,
126
+ "learning_rate": 3.0303030303030305e-06,
127
+ "loss": 0.2092,
128
+ "step": 140
129
+ },
130
+ {
131
+ "epoch": 4.55,
132
+ "learning_rate": 1.8181818181818183e-06,
133
+ "loss": 0.2314,
134
+ "step": 150
135
+ },
136
+ {
137
+ "epoch": 4.85,
138
+ "learning_rate": 6.060606060606061e-07,
139
+ "loss": 0.2135,
140
+ "step": 160
141
+ },
142
+ {
143
+ "epoch": 5.0,
144
+ "eval_accuracy": 0.9774436090225563,
145
+ "eval_loss": 0.19460569322109222,
146
+ "eval_runtime": 1.9052,
147
+ "eval_samples_per_second": 69.809,
148
+ "eval_steps_per_second": 2.624,
149
+ "step": 165
150
+ },
151
+ {
152
+ "epoch": 5.0,
153
+ "step": 165,
154
+ "total_flos": 0.0,
155
+ "train_loss": 0.42934251626332604,
156
+ "train_runtime": 152.2911,
157
+ "train_samples_per_second": 33.948,
158
+ "train_steps_per_second": 1.083
159
+ }
160
+ ],
161
+ "max_steps": 165,
162
+ "num_train_epochs": 5,
163
+ "total_flos": 0.0,
164
+ "trial_name": null,
165
+ "trial_params": null
166
+ }