Jaewan committed on
Commit
15ff140
·
1 Parent(s): 4688b05

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "eval_loss": 0.3793739378452301,
4
+ "eval_runtime": 78.0857,
5
+ "eval_samples": 1647,
6
+ "eval_samples_per_second": 21.092,
7
+ "eval_steps_per_second": 2.638,
8
+ "eval_wer": 0.3446021856807272,
9
+ "train_loss": 1.0822357591868177,
10
+ "train_runtime": 3765.0907,
11
+ "train_samples": 3478,
12
+ "train_samples_per_second": 13.856,
13
+ "train_steps_per_second": 0.434
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "eval_loss": 0.3793739378452301,
4
+ "eval_runtime": 78.0857,
5
+ "eval_samples": 1647,
6
+ "eval_samples_per_second": 21.092,
7
+ "eval_steps_per_second": 2.638,
8
+ "eval_wer": 0.3446021856807272
9
+ }
runs/Dec19_10-36-20_gpu08/events.out.tfevents.1671452678.gpu08.217435.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e05381a497f1315e5aa6576d20638e142ae71f31ac454a9d2f44fe4f3cc2092
3
+ size 358
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "train_loss": 1.0822357591868177,
4
+ "train_runtime": 3765.0907,
5
+ "train_samples": 3478,
6
+ "train_samples_per_second": 13.856,
7
+ "train_steps_per_second": 0.434
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,187 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 15.0,
5
+ "global_step": 1635,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.92,
12
+ "eval_loss": 3.595559597015381,
13
+ "eval_runtime": 78.9286,
14
+ "eval_samples_per_second": 20.867,
15
+ "eval_steps_per_second": 2.61,
16
+ "eval_wer": 1.0,
17
+ "step": 100
18
+ },
19
+ {
20
+ "epoch": 1.83,
21
+ "eval_loss": 3.0269057750701904,
22
+ "eval_runtime": 78.2182,
23
+ "eval_samples_per_second": 21.056,
24
+ "eval_steps_per_second": 2.634,
25
+ "eval_wer": 0.9998978653865795,
26
+ "step": 200
27
+ },
28
+ {
29
+ "epoch": 2.75,
30
+ "eval_loss": 0.9827112555503845,
31
+ "eval_runtime": 77.904,
32
+ "eval_samples_per_second": 21.141,
33
+ "eval_steps_per_second": 2.644,
34
+ "eval_wer": 0.8110509651720968,
35
+ "step": 300
36
+ },
37
+ {
38
+ "epoch": 3.67,
39
+ "eval_loss": 0.6235527396202087,
40
+ "eval_runtime": 78.104,
41
+ "eval_samples_per_second": 21.087,
42
+ "eval_steps_per_second": 2.638,
43
+ "eval_wer": 0.6303748340312532,
44
+ "step": 400
45
+ },
46
+ {
47
+ "epoch": 4.59,
48
+ "learning_rate": 0.0002988,
49
+ "loss": 3.1866,
50
+ "step": 500
51
+ },
52
+ {
53
+ "epoch": 4.59,
54
+ "eval_loss": 0.5015883445739746,
55
+ "eval_runtime": 78.1295,
56
+ "eval_samples_per_second": 21.08,
57
+ "eval_steps_per_second": 2.637,
58
+ "eval_wer": 0.5264017975691963,
59
+ "step": 500
60
+ },
61
+ {
62
+ "epoch": 5.5,
63
+ "eval_loss": 0.4523301422595978,
64
+ "eval_runtime": 77.6138,
65
+ "eval_samples_per_second": 21.22,
66
+ "eval_steps_per_second": 2.654,
67
+ "eval_wer": 0.493514452047799,
68
+ "step": 600
69
+ },
70
+ {
71
+ "epoch": 6.42,
72
+ "eval_loss": 0.4305676221847534,
73
+ "eval_runtime": 78.2496,
74
+ "eval_samples_per_second": 21.048,
75
+ "eval_steps_per_second": 2.633,
76
+ "eval_wer": 0.4527627412930242,
77
+ "step": 700
78
+ },
79
+ {
80
+ "epoch": 7.34,
81
+ "eval_loss": 0.43279117345809937,
82
+ "eval_runtime": 78.3317,
83
+ "eval_samples_per_second": 21.026,
84
+ "eval_steps_per_second": 2.63,
85
+ "eval_wer": 0.43294862628944947,
86
+ "step": 800
87
+ },
88
+ {
89
+ "epoch": 8.26,
90
+ "eval_loss": 0.40258118510246277,
91
+ "eval_runtime": 77.3151,
92
+ "eval_samples_per_second": 21.302,
93
+ "eval_steps_per_second": 2.664,
94
+ "eval_wer": 0.4104790113369421,
95
+ "step": 900
96
+ },
97
+ {
98
+ "epoch": 9.17,
99
+ "learning_rate": 0.00016837004405286342,
100
+ "loss": 0.227,
101
+ "step": 1000
102
+ },
103
+ {
104
+ "epoch": 9.17,
105
+ "eval_loss": 0.409604012966156,
106
+ "eval_runtime": 77.7312,
107
+ "eval_samples_per_second": 21.188,
108
+ "eval_steps_per_second": 2.65,
109
+ "eval_wer": 0.4080277806148504,
110
+ "step": 1000
111
+ },
112
+ {
113
+ "epoch": 10.09,
114
+ "eval_loss": 0.3921073079109192,
115
+ "eval_runtime": 78.0257,
116
+ "eval_samples_per_second": 21.108,
117
+ "eval_steps_per_second": 2.64,
118
+ "eval_wer": 0.3914819732407313,
119
+ "step": 1100
120
+ },
121
+ {
122
+ "epoch": 11.01,
123
+ "eval_loss": 0.3830062448978424,
124
+ "eval_runtime": 77.5372,
125
+ "eval_samples_per_second": 21.241,
126
+ "eval_steps_per_second": 2.657,
127
+ "eval_wer": 0.37779593504238584,
128
+ "step": 1200
129
+ },
130
+ {
131
+ "epoch": 11.93,
132
+ "eval_loss": 0.38462668657302856,
133
+ "eval_runtime": 77.1044,
134
+ "eval_samples_per_second": 21.361,
135
+ "eval_steps_per_second": 2.672,
136
+ "eval_wer": 0.36155653150852823,
137
+ "step": 1300
138
+ },
139
+ {
140
+ "epoch": 12.84,
141
+ "eval_loss": 0.3887845277786255,
142
+ "eval_runtime": 76.824,
143
+ "eval_samples_per_second": 21.439,
144
+ "eval_steps_per_second": 2.681,
145
+ "eval_wer": 0.3618629353487897,
146
+ "step": 1400
147
+ },
148
+ {
149
+ "epoch": 13.76,
150
+ "learning_rate": 3.621145374449339e-05,
151
+ "loss": 0.1046,
152
+ "step": 1500
153
+ },
154
+ {
155
+ "epoch": 13.76,
156
+ "eval_loss": 0.38607490062713623,
157
+ "eval_runtime": 78.3544,
158
+ "eval_samples_per_second": 21.02,
159
+ "eval_steps_per_second": 2.629,
160
+ "eval_wer": 0.3509345317127975,
161
+ "step": 1500
162
+ },
163
+ {
164
+ "epoch": 14.68,
165
+ "eval_loss": 0.3798215985298157,
166
+ "eval_runtime": 77.659,
167
+ "eval_samples_per_second": 21.208,
168
+ "eval_steps_per_second": 2.653,
169
+ "eval_wer": 0.3455213972015116,
170
+ "step": 1600
171
+ },
172
+ {
173
+ "epoch": 15.0,
174
+ "step": 1635,
175
+ "total_flos": 6.464559143942451e+18,
176
+ "train_loss": 1.0822357591868177,
177
+ "train_runtime": 3765.0907,
178
+ "train_samples_per_second": 13.856,
179
+ "train_steps_per_second": 0.434
180
+ }
181
+ ],
182
+ "max_steps": 1635,
183
+ "num_train_epochs": 15,
184
+ "total_flos": 6.464559143942451e+18,
185
+ "trial_name": null,
186
+ "trial_params": null
187
+ }