zuazo committed on
Commit
a8bb11b
·
verified ·
1 Parent(s): 12eaf33

Model save

Browse files
Files changed (2) hide show
  1. README.md +19 -21
  2. generation_config.json +3 -2
README.md CHANGED
@@ -1,42 +1,39 @@
1
  ---
2
- language:
3
- - gl
4
  license: apache-2.0
5
  base_model: openai/whisper-base
6
  tags:
7
- - whisper-event
8
  - generated_from_trainer
9
  datasets:
10
- - mozilla-foundation/common_voice_13_0
11
  metrics:
12
  - wer
13
  model-index:
14
- - name: Whisper Base Galician
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
18
  type: automatic-speech-recognition
19
  dataset:
20
- name: mozilla-foundation/common_voice_13_0 gl
21
- type: mozilla-foundation/common_voice_13_0
22
  config: gl
23
  split: test
24
  args: gl
25
  metrics:
26
  - name: Wer
27
  type: wer
28
- value: 18.687913907284766
29
  ---
30
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
32
  should probably proofread and complete it, then remove this comment. -->
33
 
34
- # Whisper Base Galician
35
 
36
- This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on the mozilla-foundation/common_voice_13_0 gl dataset.
37
  It achieves the following results on the evaluation set:
38
- - Loss: 0.4754
39
- - Wer: 18.6879
40
 
41
  ## Model description
42
 
@@ -63,21 +60,22 @@ The following hyperparameters were used during training:
63
  - lr_scheduler_type: linear
64
  - lr_scheduler_warmup_steps: 500
65
  - training_steps: 5000
 
66
 
67
  ### Training results
68
 
69
  | Training Loss | Epoch | Step | Validation Loss | Wer |
70
  |:-------------:|:-----:|:----:|:---------------:|:-------:|
71
- | 0.0088 | 9.02 | 1000 | 0.4219 | 18.7776 |
72
- | 0.0015 | 19.02 | 2000 | 0.4754 | 18.6879 |
73
- | 0.0008 | 29.02 | 3000 | 0.5036 | 18.9000 |
74
- | 0.0005 | 39.02 | 4000 | 0.5225 | 19.0553 |
75
- | 0.0004 | 49.02 | 5000 | 0.5307 | 19.1122 |
76
 
77
 
78
  ### Framework versions
79
 
80
- - Transformers 4.33.0.dev0
81
- - Pytorch 2.0.1+cu117
82
- - Datasets 2.14.4
83
- - Tokenizers 0.13.3
 
1
  ---
 
 
2
  license: apache-2.0
3
  base_model: openai/whisper-base
4
  tags:
 
5
  - generated_from_trainer
6
  datasets:
7
+ - common_voice_13_0
8
  metrics:
9
  - wer
10
  model-index:
11
+ - name: openai/whisper-base
12
  results:
13
  - task:
14
  name: Automatic Speech Recognition
15
  type: automatic-speech-recognition
16
  dataset:
17
+ name: common_voice_13_0
18
+ type: common_voice_13_0
19
  config: gl
20
  split: test
21
  args: gl
22
  metrics:
23
  - name: Wer
24
  type: wer
25
+ value: 17.290976821192054
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
29
  should probably proofread and complete it, then remove this comment. -->
30
 
31
+ # openai/whisper-base
32
 
33
+ This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on the common_voice_13_0 dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.4360
36
+ - Wer: 17.2910
37
 
38
  ## Model description
39
 
 
60
  - lr_scheduler_type: linear
61
  - lr_scheduler_warmup_steps: 500
62
  - training_steps: 5000
63
+ - mixed_precision_training: Native AMP
64
 
65
  ### Training results
66
 
67
  | Training Loss | Epoch | Step | Validation Loss | Wer |
68
  |:-------------:|:-----:|:----:|:---------------:|:-------:|
69
+ | 0.372 | 10.0 | 1000 | 0.4173 | 21.0023 |
70
+ | 0.1352 | 20.0 | 2000 | 0.3982 | 18.3620 |
71
+ | 0.0638 | 30.0 | 3000 | 0.4175 | 17.8842 |
72
+ | 0.0371 | 40.0 | 4000 | 0.4310 | 17.4721 |
73
+ | 0.0279 | 50.0 | 5000 | 0.4360 | 17.2910 |
74
 
75
 
76
  ### Framework versions
77
 
78
+ - Transformers 4.37.2
79
+ - Pytorch 2.2.0+cu121
80
+ - Datasets 2.16.1
81
+ - Tokenizers 0.15.1
generation_config.json CHANGED
@@ -152,10 +152,11 @@
152
  "<|yo|>": 50325,
153
  "<|zh|>": 50260
154
  },
155
- "max_initial_timestamp_index": 1,
156
  "max_length": 448,
157
  "no_timestamps_token_id": 50363,
158
  "pad_token_id": 50257,
 
159
  "return_timestamps": false,
160
  "suppress_tokens": [
161
  1,
@@ -251,5 +252,5 @@
251
  "transcribe": 50359,
252
  "translate": 50358
253
  },
254
- "transformers_version": "4.33.0.dev0"
255
  }
 
152
  "<|yo|>": 50325,
153
  "<|zh|>": 50260
154
  },
155
+ "max_initial_timestamp_index": 50,
156
  "max_length": 448,
157
  "no_timestamps_token_id": 50363,
158
  "pad_token_id": 50257,
159
+ "prev_sot_token_id": 50361,
160
  "return_timestamps": false,
161
  "suppress_tokens": [
162
  1,
 
252
  "transcribe": 50359,
253
  "translate": 50358
254
  },
255
+ "transformers_version": "4.37.2"
256
  }