bagasshw committed on
Commit
d0dddce
·
verified ·
1 Parent(s): 32cb015

End of training

Browse files
README.md CHANGED
@@ -1,15 +1,20 @@
1
  ---
2
  library_name: transformers
 
 
3
  license: apache-2.0
4
  base_model: openai/whisper-tiny
5
  tags:
 
 
 
6
  - generated_from_trainer
7
  datasets:
8
  - jv_id_asr_split
9
  metrics:
10
  - wer
11
  model-index:
12
- - name: whisper-tiny-javanese-openslr-v2
13
  results:
14
  - task:
15
  name: Automatic Speech Recognition
@@ -29,7 +34,7 @@ model-index:
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
30
  should probably proofread and complete it, then remove this comment. -->
31
 
32
- # whisper-tiny-javanese-openslr-v2
33
 
34
  This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the jv_id_asr_split dataset.
35
  It achieves the following results on the evaluation set:
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - jv
5
  license: apache-2.0
6
  base_model: openai/whisper-tiny
7
  tags:
8
+ - whisper
9
+ - javanese
10
+ - asr
11
  - generated_from_trainer
12
  datasets:
13
  - jv_id_asr_split
14
  metrics:
15
  - wer
16
  model-index:
17
+ - name: Whisper Tiny Java
18
  results:
19
  - task:
20
  name: Automatic Speech Recognition
 
34
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
35
  should probably proofread and complete it, then remove this comment. -->
36
 
37
+ # Whisper Tiny Java
38
 
39
  This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the jv_id_asr_split dataset.
40
  It achieves the following results on the evaluation set:
all_results.json CHANGED
@@ -1,21 +1,21 @@
1
  {
2
- "epoch": 4.9922212618841835,
3
- "eval_loss": 0.5638014078140259,
4
- "eval_runtime": 4431.4054,
5
  "eval_samples": 18504,
6
- "eval_samples_per_second": 4.176,
7
- "eval_steps_per_second": 0.261,
8
- "eval_wer": 0.4824482518630893,
9
  "pretrained_eval_loss": 4.0292205810546875,
10
  "pretrained_eval_model_preparation_time": 0.0019,
11
  "pretrained_eval_runtime": 3181.6206,
12
  "pretrained_eval_samples_per_second": 5.816,
13
  "pretrained_eval_steps_per_second": 0.364,
14
  "pretrained_eval_wer": 1.3043423861619188,
15
- "total_flos": 1.819709817421824e+19,
16
- "train_loss": 0.0,
17
- "train_runtime": 0.166,
18
  "train_samples": 148052,
19
- "train_samples_per_second": 4460643.449,
20
- "train_steps_per_second": 17414.502
21
  }
 
1
  {
2
+ "epoch": 4.32152117545376,
3
+ "eval_loss": 0.2792496979236603,
4
+ "eval_runtime": 2784.0877,
5
  "eval_samples": 18504,
6
+ "eval_samples_per_second": 6.646,
7
+ "eval_steps_per_second": 0.416,
8
+ "eval_wer": 0.6471586421539112,
9
  "pretrained_eval_loss": 4.0292205810546875,
10
  "pretrained_eval_model_preparation_time": 0.0019,
11
  "pretrained_eval_runtime": 3181.6206,
12
  "pretrained_eval_samples_per_second": 5.816,
13
  "pretrained_eval_steps_per_second": 0.364,
14
  "pretrained_eval_wer": 1.3043423861619188,
15
+ "total_flos": 1.574545111842816e+19,
16
+ "train_loss": 0.17131386260986328,
17
+ "train_runtime": 60097.0332,
18
  "train_samples": 148052,
19
+ "train_samples_per_second": 10.649,
20
+ "train_steps_per_second": 0.042
21
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 4.9922212618841835,
3
- "eval_loss": 0.5638014078140259,
4
- "eval_runtime": 4431.4054,
5
  "eval_samples": 18504,
6
- "eval_samples_per_second": 4.176,
7
- "eval_steps_per_second": 0.261,
8
- "eval_wer": 0.4824482518630893
9
  }
 
1
  {
2
+ "epoch": 4.32152117545376,
3
+ "eval_loss": 0.2792496979236603,
4
+ "eval_runtime": 2784.0877,
5
  "eval_samples": 18504,
6
+ "eval_samples_per_second": 6.646,
7
+ "eval_steps_per_second": 0.416,
8
+ "eval_wer": 0.6471586421539112
9
  }
runs/Mar16_11-27-13_dgx-a100/events.out.tfevents.1742162147.dgx-a100.690596.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e21f99fd4b547a7a4a11673fb97d703230d36858f63e11d5e9466d541fd28a3d
3
+ size 406
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 4.9922212618841835,
3
- "total_flos": 1.819709817421824e+19,
4
- "train_loss": 0.0,
5
- "train_runtime": 0.166,
6
  "train_samples": 148052,
7
- "train_samples_per_second": 4460643.449,
8
- "train_steps_per_second": 17414.502
9
  }
 
1
  {
2
+ "epoch": 4.32152117545376,
3
+ "total_flos": 1.574545111842816e+19,
4
+ "train_loss": 0.17131386260986328,
5
+ "train_runtime": 60097.0332,
6
  "train_samples": 148052,
7
+ "train_samples_per_second": 10.649,
8
+ "train_steps_per_second": 0.042
9
  }
trainer_state.json CHANGED
@@ -1,266 +1,246 @@
1
  {
2
- "best_metric": 0.4824482518630893,
 
3
  "best_model_checkpoint": "/raid/p-storage/slp01_565a7357/bagas-fine-tune-whisper/whisper-tiny-javanese-openslr-v2/checkpoint-500",
4
- "epoch": 4.9922212618841835,
5
  "eval_steps": 500,
6
- "global_step": 2890,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.17286084701815038,
13
- "grad_norm": 6.286952018737793,
14
- "learning_rate": 3.3910034602076125e-06,
15
- "loss": 3.0341,
16
  "step": 100
17
  },
18
  {
19
  "epoch": 0.34572169403630076,
20
- "grad_norm": 4.7146077156066895,
21
- "learning_rate": 6.85121107266436e-06,
22
- "loss": 1.3208,
23
  "step": 200
24
  },
25
  {
26
  "epoch": 0.5185825410544511,
27
- "grad_norm": 4.3300933837890625,
28
- "learning_rate": 9.965397923875434e-06,
29
- "loss": 0.9403,
30
  "step": 300
31
  },
32
  {
33
  "epoch": 0.6914433880726015,
34
- "grad_norm": 4.19991397857666,
35
- "learning_rate": 9.580930411380239e-06,
36
- "loss": 0.7674,
37
  "step": 400
38
  },
39
  {
40
  "epoch": 0.8643042350907519,
41
- "grad_norm": 3.640639066696167,
42
- "learning_rate": 9.196462898885045e-06,
43
- "loss": 0.6676,
44
  "step": 500
45
  },
46
  {
47
  "epoch": 0.8643042350907519,
48
- "eval_loss": 0.5638014078140259,
49
- "eval_runtime": 6063.2097,
50
- "eval_samples_per_second": 3.052,
51
- "eval_steps_per_second": 0.191,
52
- "eval_wer": 0.4824482518630893,
53
  "step": 500
54
  },
55
  {
56
  "epoch": 1.0363007778738116,
57
- "grad_norm": 3.6083388328552246,
58
- "learning_rate": 8.811995386389852e-06,
59
- "loss": 0.6009,
60
  "step": 600
61
  },
62
  {
63
  "epoch": 1.2091616248919619,
64
- "grad_norm": 3.529407024383545,
65
- "learning_rate": 8.427527873894657e-06,
66
- "loss": 0.5501,
67
  "step": 700
68
  },
69
  {
70
  "epoch": 1.3820224719101124,
71
- "grad_norm": 3.4671249389648438,
72
- "learning_rate": 8.043060361399463e-06,
73
- "loss": 0.523,
74
  "step": 800
75
  },
76
  {
77
  "epoch": 1.5548833189282627,
78
- "grad_norm": 3.357516288757324,
79
- "learning_rate": 7.658592848904268e-06,
80
- "loss": 0.4992,
81
  "step": 900
82
  },
83
  {
84
  "epoch": 1.727744165946413,
85
- "grad_norm": 3.260972738265991,
86
- "learning_rate": 7.274125336409074e-06,
87
- "loss": 0.4792,
88
  "step": 1000
89
  },
90
  {
91
  "epoch": 1.727744165946413,
92
- "eval_loss": 0.42836251854896545,
93
- "eval_runtime": 5157.0546,
94
- "eval_samples_per_second": 3.588,
95
- "eval_steps_per_second": 0.224,
96
- "eval_wer": 0.5330351347758427,
97
  "step": 1000
98
  },
99
  {
100
- "epoch": 1.9006050129645635,
101
- "grad_norm": 3.132084608078003,
102
- "learning_rate": 6.88965782391388e-06,
103
- "loss": 0.4654,
104
  "step": 1100
105
  },
106
  {
107
- "epoch": 2.072601555747623,
108
- "grad_norm": 3.0205070972442627,
109
- "learning_rate": 6.505190311418685e-06,
110
- "loss": 0.4387,
111
  "step": 1200
112
  },
113
  {
114
- "epoch": 2.2454624027657735,
115
- "grad_norm": 3.090315103530884,
116
- "learning_rate": 6.120722798923492e-06,
117
- "loss": 0.4201,
118
  "step": 1300
119
  },
120
  {
121
- "epoch": 2.4183232497839238,
122
- "grad_norm": 3.003020763397217,
123
- "learning_rate": 5.736255286428297e-06,
124
- "loss": 0.4111,
125
  "step": 1400
126
  },
127
  {
128
- "epoch": 2.591184096802074,
129
- "grad_norm": 2.9050354957580566,
130
- "learning_rate": 5.351787773933102e-06,
131
- "loss": 0.3988,
132
  "step": 1500
133
  },
134
  {
135
- "epoch": 2.591184096802074,
136
- "eval_loss": 0.3772418200969696,
137
- "eval_runtime": 3820.8123,
138
- "eval_samples_per_second": 4.843,
139
- "eval_steps_per_second": 0.303,
140
- "eval_wer": 0.5687485826445312,
141
  "step": 1500
142
  },
143
  {
144
- "epoch": 2.764044943820225,
145
- "grad_norm": 2.983358383178711,
146
- "learning_rate": 4.967320261437909e-06,
147
- "loss": 0.392,
148
  "step": 1600
149
  },
150
  {
151
- "epoch": 2.936905790838375,
152
- "grad_norm": 2.932623863220215,
153
- "learning_rate": 4.5828527489427145e-06,
154
- "loss": 0.3882,
155
  "step": 1700
156
  },
157
  {
158
- "epoch": 3.1089023336214345,
159
- "grad_norm": 2.8963847160339355,
160
- "learning_rate": 4.19838523644752e-06,
161
- "loss": 0.3684,
162
  "step": 1800
163
  },
164
  {
165
- "epoch": 3.2817631806395853,
166
- "grad_norm": 3.005558967590332,
167
- "learning_rate": 3.8139177239523264e-06,
168
- "loss": 0.3638,
169
  "step": 1900
170
  },
171
  {
172
- "epoch": 3.4546240276577356,
173
- "grad_norm": 2.9087977409362793,
174
- "learning_rate": 3.429450211457132e-06,
175
- "loss": 0.3565,
176
  "step": 2000
177
  },
178
  {
179
- "epoch": 3.4546240276577356,
180
- "eval_loss": 0.35282832384109497,
181
- "eval_runtime": 3674.1258,
182
- "eval_samples_per_second": 5.036,
183
- "eval_steps_per_second": 0.315,
184
- "eval_wer": 0.6203598714409715,
185
  "step": 2000
186
  },
187
  {
188
- "epoch": 3.627484874675886,
189
- "grad_norm": 2.949126958847046,
190
- "learning_rate": 3.044982698961938e-06,
191
- "loss": 0.3582,
192
  "step": 2100
193
  },
194
  {
195
- "epoch": 3.800345721694036,
196
- "grad_norm": 2.861595869064331,
197
- "learning_rate": 2.660515186466744e-06,
198
- "loss": 0.3549,
199
  "step": 2200
200
  },
201
  {
202
- "epoch": 3.973206568712187,
203
- "grad_norm": 2.6879312992095947,
204
- "learning_rate": 2.2760476739715497e-06,
205
- "loss": 0.351,
206
  "step": 2300
207
  },
208
  {
209
- "epoch": 4.145203111495246,
210
- "grad_norm": 3.0249099731445312,
211
- "learning_rate": 1.8915801614763554e-06,
212
- "loss": 0.339,
213
  "step": 2400
214
  },
215
  {
216
- "epoch": 4.318063958513397,
217
- "grad_norm": 2.900782585144043,
218
- "learning_rate": 1.5071126489811613e-06,
219
- "loss": 0.3386,
220
  "step": 2500
221
  },
222
  {
223
- "epoch": 4.318063958513397,
224
- "eval_loss": 0.34060564637184143,
225
- "eval_runtime": 4820.2463,
226
- "eval_samples_per_second": 3.839,
227
- "eval_steps_per_second": 0.24,
228
- "eval_wer": 0.6603038810125197,
229
  "step": 2500
230
  },
231
  {
232
- "epoch": 4.490924805531547,
233
- "grad_norm": 2.7883245944976807,
234
- "learning_rate": 1.122645136485967e-06,
235
- "loss": 0.3351,
236
- "step": 2600
237
- },
238
- {
239
- "epoch": 4.663785652549698,
240
- "grad_norm": 2.759507894515991,
241
- "learning_rate": 7.381776239907729e-07,
242
- "loss": 0.3364,
243
- "step": 2700
244
- },
245
- {
246
- "epoch": 4.8366464995678475,
247
- "grad_norm": 2.8885769844055176,
248
- "learning_rate": 3.5371011149557864e-07,
249
- "loss": 0.334,
250
- "step": 2800
251
- },
252
- {
253
- "epoch": 4.9922212618841835,
254
- "step": 2890,
255
- "total_flos": 1.819709817421824e+19,
256
- "train_loss": 0.0,
257
- "train_runtime": 0.166,
258
- "train_samples_per_second": 4460643.449,
259
- "train_steps_per_second": 17414.502
260
  }
261
  ],
262
  "logging_steps": 100,
263
- "max_steps": 2890,
264
  "num_input_tokens_seen": 0,
265
  "num_train_epochs": 5,
266
  "save_steps": 500,
@@ -276,7 +256,7 @@
276
  "attributes": {}
277
  }
278
  },
279
- "total_flos": 1.819709817421824e+19,
280
  "train_batch_size": 64,
281
  "trial_name": null,
282
  "trial_params": null
 
1
  {
2
+ "best_global_step": null,
3
+ "best_metric": 0.47698996707825364,
4
  "best_model_checkpoint": "/raid/p-storage/slp01_565a7357/bagas-fine-tune-whisper/whisper-tiny-javanese-openslr-v2/checkpoint-500",
5
+ "epoch": 4.32152117545376,
6
  "eval_steps": 500,
7
+ "global_step": 2500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
  "epoch": 0.17286084701815038,
14
+ "grad_norm": 5.079843521118164,
15
+ "learning_rate": 7.840000000000001e-06,
16
+ "loss": 2.5618,
17
  "step": 100
18
  },
19
  {
20
  "epoch": 0.34572169403630076,
21
+ "grad_norm": 4.103299617767334,
22
+ "learning_rate": 1.584e-05,
23
+ "loss": 1.021,
24
  "step": 200
25
  },
26
  {
27
  "epoch": 0.5185825410544511,
28
+ "grad_norm": 3.8726439476013184,
29
+ "learning_rate": 1.9573333333333335e-05,
30
+ "loss": 0.7363,
31
  "step": 300
32
  },
33
  {
34
  "epoch": 0.6914433880726015,
35
+ "grad_norm": 3.9386720657348633,
36
+ "learning_rate": 1.8684444444444446e-05,
37
+ "loss": 0.6066,
38
  "step": 400
39
  },
40
  {
41
  "epoch": 0.8643042350907519,
42
+ "grad_norm": 3.273592472076416,
43
+ "learning_rate": 1.7795555555555557e-05,
44
+ "loss": 0.528,
45
  "step": 500
46
  },
47
  {
48
  "epoch": 0.8643042350907519,
49
+ "eval_loss": 0.4466875493526459,
50
+ "eval_runtime": 5073.2528,
51
+ "eval_samples_per_second": 3.647,
52
+ "eval_steps_per_second": 0.228,
53
+ "eval_wer": 0.47698996707825364,
54
  "step": 500
55
  },
56
  {
57
  "epoch": 1.0363007778738116,
58
+ "grad_norm": 3.0979788303375244,
59
+ "learning_rate": 1.690666666666667e-05,
60
+ "loss": 0.4728,
61
  "step": 600
62
  },
63
  {
64
  "epoch": 1.2091616248919619,
65
+ "grad_norm": 3.1844944953918457,
66
+ "learning_rate": 1.601777777777778e-05,
67
+ "loss": 0.4222,
68
  "step": 700
69
  },
70
  {
71
  "epoch": 1.3820224719101124,
72
+ "grad_norm": 2.981661319732666,
73
+ "learning_rate": 1.5128888888888891e-05,
74
+ "loss": 0.404,
75
  "step": 800
76
  },
77
  {
78
  "epoch": 1.5548833189282627,
79
+ "grad_norm": 3.146735906600952,
80
+ "learning_rate": 1.4240000000000001e-05,
81
+ "loss": 0.3867,
82
  "step": 900
83
  },
84
  {
85
  "epoch": 1.727744165946413,
86
+ "grad_norm": 2.873340368270874,
87
+ "learning_rate": 1.3351111111111112e-05,
88
+ "loss": 0.3702,
89
  "step": 1000
90
  },
91
  {
92
  "epoch": 1.727744165946413,
93
+ "eval_loss": 0.34238535165786743,
94
+ "eval_runtime": 6401.1103,
95
+ "eval_samples_per_second": 2.891,
96
+ "eval_steps_per_second": 0.181,
97
+ "eval_wer": 0.5528429218245372,
98
  "step": 1000
99
  },
100
  {
101
+ "epoch": 1.902333621434745,
102
+ "grad_norm": 2.7809109687805176,
103
+ "learning_rate": 1.2462222222222222e-05,
104
+ "loss": 0.3611,
105
  "step": 1100
106
  },
107
  {
108
+ "epoch": 2.076058772687986,
109
+ "grad_norm": 2.62384295463562,
110
+ "learning_rate": 1.1573333333333335e-05,
111
+ "loss": 0.3371,
112
  "step": 1200
113
  },
114
  {
115
+ "epoch": 2.2489196197061365,
116
+ "grad_norm": 2.793154716491699,
117
+ "learning_rate": 1.0684444444444446e-05,
118
+ "loss": 0.3134,
119
  "step": 1300
120
  },
121
  {
122
+ "epoch": 2.421780466724287,
123
+ "grad_norm": 2.5597171783447266,
124
+ "learning_rate": 9.795555555555556e-06,
125
+ "loss": 0.3069,
126
  "step": 1400
127
  },
128
  {
129
+ "epoch": 2.5946413137424376,
130
+ "grad_norm": 2.6140079498291016,
131
+ "learning_rate": 8.906666666666667e-06,
132
+ "loss": 0.2988,
133
  "step": 1500
134
  },
135
  {
136
+ "epoch": 2.5946413137424376,
137
+ "eval_loss": 0.30312925577163696,
138
+ "eval_runtime": 2962.721,
139
+ "eval_samples_per_second": 6.246,
140
+ "eval_steps_per_second": 0.391,
141
+ "eval_wer": 0.5552201690660703,
142
  "step": 1500
143
  },
144
  {
145
+ "epoch": 2.767502160760588,
146
+ "grad_norm": 2.635817050933838,
147
+ "learning_rate": 8.017777777777779e-06,
148
+ "loss": 0.2948,
149
  "step": 1600
150
  },
151
  {
152
+ "epoch": 2.940363007778738,
153
+ "grad_norm": 2.918149709701538,
154
+ "learning_rate": 7.12888888888889e-06,
155
+ "loss": 0.2903,
156
  "step": 1700
157
  },
158
  {
159
+ "epoch": 3.1123595505617976,
160
+ "grad_norm": 2.2907419204711914,
161
+ "learning_rate": 6.24e-06,
162
+ "loss": 0.2711,
163
  "step": 1800
164
  },
165
  {
166
+ "epoch": 3.2852203975799483,
167
+ "grad_norm": 2.640625238418579,
168
+ "learning_rate": 5.351111111111112e-06,
169
+ "loss": 0.2667,
170
  "step": 1900
171
  },
172
  {
173
+ "epoch": 3.4580812445980986,
174
+ "grad_norm": 2.5180225372314453,
175
+ "learning_rate": 4.462222222222223e-06,
176
+ "loss": 0.2607,
177
  "step": 2000
178
  },
179
  {
180
+ "epoch": 3.4580812445980986,
181
+ "eval_loss": 0.28587546944618225,
182
+ "eval_runtime": 2830.646,
183
+ "eval_samples_per_second": 6.537,
184
+ "eval_steps_per_second": 0.409,
185
+ "eval_wer": 0.6484880238350316,
186
  "step": 2000
187
  },
188
  {
189
+ "epoch": 3.630942091616249,
190
+ "grad_norm": 2.6452524662017822,
191
+ "learning_rate": 3.5733333333333336e-06,
192
+ "loss": 0.2637,
193
  "step": 2100
194
  },
195
  {
196
+ "epoch": 3.8038029386343992,
197
+ "grad_norm": 2.3364474773406982,
198
+ "learning_rate": 2.6844444444444445e-06,
199
+ "loss": 0.2615,
200
  "step": 2200
201
  },
202
  {
203
+ "epoch": 3.9766637856525495,
204
+ "grad_norm": 2.414165496826172,
205
+ "learning_rate": 1.7955555555555556e-06,
206
+ "loss": 0.2603,
207
  "step": 2300
208
  },
209
  {
210
+ "epoch": 4.148660328435609,
211
+ "grad_norm": 2.3572444915771484,
212
+ "learning_rate": 9.066666666666668e-07,
213
+ "loss": 0.2483,
214
  "step": 2400
215
  },
216
  {
217
+ "epoch": 4.32152117545376,
218
+ "grad_norm": 2.6238534450531006,
219
+ "learning_rate": 1.777777777777778e-08,
220
+ "loss": 0.2481,
221
  "step": 2500
222
  },
223
  {
224
+ "epoch": 4.32152117545376,
225
+ "eval_loss": 0.2792496979236603,
226
+ "eval_runtime": 2806.8606,
227
+ "eval_samples_per_second": 6.592,
228
+ "eval_steps_per_second": 0.412,
229
+ "eval_wer": 0.6471586421539112,
230
  "step": 2500
231
  },
232
  {
233
+ "epoch": 4.32152117545376,
234
+ "step": 2500,
235
+ "total_flos": 1.574545111842816e+19,
236
+ "train_loss": 0.17131386260986328,
237
+ "train_runtime": 60097.0332,
238
+ "train_samples_per_second": 10.649,
239
+ "train_steps_per_second": 0.042
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
240
  }
241
  ],
242
  "logging_steps": 100,
243
+ "max_steps": 2500,
244
  "num_input_tokens_seen": 0,
245
  "num_train_epochs": 5,
246
  "save_steps": 500,
 
256
  "attributes": {}
257
  }
258
  },
259
+ "total_flos": 1.574545111842816e+19,
260
  "train_batch_size": 64,
261
  "trial_name": null,
262
  "trial_params": null