liuh6 committed on
Commit
9af7d29
·
verified ·
1 Parent(s): 0c7971c

End of training

Browse files
Files changed (2) hide show
  1. README.md +7 -8
  2. generation_config.json +90 -1
README.md CHANGED
@@ -24,7 +24,7 @@ model-index:
24
  metrics:
25
  - name: Wer
26
  type: wer
27
- value: 16.060365369340744
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -34,8 +34,8 @@ should probably proofread and complete it, then remove this comment. -->
34
 
35
  This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the Chinese English dataset.
36
  It achieves the following results on the evaluation set:
37
- - Loss: 0.3722
38
- - Wer: 16.0604
39
 
40
  ## Model description
41
 
@@ -57,19 +57,18 @@ The following hyperparameters were used during training:
57
  - learning_rate: 1e-05
58
  - train_batch_size: 2
59
  - eval_batch_size: 1
60
- - seed: 43
61
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
62
  - lr_scheduler_type: linear
63
  - lr_scheduler_warmup_steps: 500
64
- - training_steps: 1500
65
 
66
  ### Training results
67
 
68
  | Training Loss | Epoch | Step | Validation Loss | Wer |
69
  |:-------------:|:------:|:----:|:---------------:|:-------:|
70
- | 0.1887 | 1.6667 | 500 | 0.3696 | 17.6172 |
71
- | 0.0143 | 3.3333 | 1000 | 0.3665 | 15.6632 |
72
- | 0.0115 | 5.0 | 1500 | 0.3722 | 16.0604 |
73
 
74
 
75
  ### Framework versions
 
24
  metrics:
25
  - name: Wer
26
  type: wer
27
+ value: 15.583796664019061
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the Chinese English dataset.
36
  It achieves the following results on the evaluation set:
37
+ - Loss: 0.3553
38
+ - Wer: 15.5838
39
 
40
  ## Model description
41
 
 
57
  - learning_rate: 1e-05
58
  - train_batch_size: 2
59
  - eval_batch_size: 1
60
+ - seed: 44
61
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
62
  - lr_scheduler_type: linear
63
  - lr_scheduler_warmup_steps: 500
64
+ - training_steps: 1000
65
 
66
  ### Training results
67
 
68
  | Training Loss | Epoch | Step | Validation Loss | Wer |
69
  |:-------------:|:------:|:----:|:---------------:|:-------:|
70
+ | 0.2725 | 1.6667 | 500 | 0.3502 | 15.8380 |
71
+ | 0.0209 | 3.3333 | 1000 | 0.3553 | 15.5838 |
 
72
 
73
 
74
  ### Framework versions
generation_config.json CHANGED
@@ -150,7 +150,96 @@
150
  "pad_token_id": 50257,
151
  "prev_sot_token_id": 50361,
152
  "return_timestamps": false,
153
- "suppress_tokens": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
154
  "task_to_id": {
155
  "transcribe": 50359,
156
  "translate": 50358
 
150
  "pad_token_id": 50257,
151
  "prev_sot_token_id": 50361,
152
  "return_timestamps": false,
153
+ "suppress_tokens": [
154
+ 1,
155
+ 2,
156
+ 7,
157
+ 8,
158
+ 9,
159
+ 10,
160
+ 14,
161
+ 25,
162
+ 26,
163
+ 27,
164
+ 28,
165
+ 29,
166
+ 31,
167
+ 58,
168
+ 59,
169
+ 60,
170
+ 61,
171
+ 62,
172
+ 63,
173
+ 90,
174
+ 91,
175
+ 92,
176
+ 93,
177
+ 359,
178
+ 503,
179
+ 522,
180
+ 542,
181
+ 873,
182
+ 893,
183
+ 902,
184
+ 918,
185
+ 922,
186
+ 931,
187
+ 1350,
188
+ 1853,
189
+ 1982,
190
+ 2460,
191
+ 2627,
192
+ 3246,
193
+ 3253,
194
+ 3268,
195
+ 3536,
196
+ 3846,
197
+ 3961,
198
+ 4183,
199
+ 4667,
200
+ 6585,
201
+ 6647,
202
+ 7273,
203
+ 9061,
204
+ 9383,
205
+ 10428,
206
+ 10929,
207
+ 11938,
208
+ 12033,
209
+ 12331,
210
+ 12562,
211
+ 13793,
212
+ 14157,
213
+ 14635,
214
+ 15265,
215
+ 15618,
216
+ 16553,
217
+ 16604,
218
+ 18362,
219
+ 18956,
220
+ 20075,
221
+ 21675,
222
+ 22520,
223
+ 26130,
224
+ 26161,
225
+ 26435,
226
+ 28279,
227
+ 29464,
228
+ 31650,
229
+ 32302,
230
+ 32470,
231
+ 36865,
232
+ 42863,
233
+ 47425,
234
+ 49870,
235
+ 50254,
236
+ 50258,
237
+ 50358,
238
+ 50359,
239
+ 50360,
240
+ 50361,
241
+ 50362
242
+ ],
243
  "task_to_id": {
244
  "transcribe": 50359,
245
  "translate": 50358