igarciahuidobro committed on
Commit
b95900a
·
verified ·
1 Parent(s): 9c4b6dc

End of training

Browse files
README.md CHANGED
@@ -1,27 +1,25 @@
1
  ---
2
  library_name: transformers
3
- language:
4
- - spa
5
  license: apache-2.0
6
- base_model: stinoco/whisper-tiny-clinical-assistance
7
  tags:
8
  - generated_from_trainer
9
  metrics:
10
  - wer
11
  model-index:
12
- - name: Whisper Pre Tuned 300 Audios - Nacho v1.1
13
  results: []
14
  ---
15
 
16
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
17
  should probably proofread and complete it, then remove this comment. -->
18
 
19
- # Whisper Pre Tuned 300 Audios - Nacho v1.1
20
 
21
- This model is a fine-tuned version of [stinoco/whisper-tiny-clinical-assistance](https://huggingface.co/stinoco/whisper-tiny-clinical-assistance) on the 300 audios 1.0 dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: 0.4287
24
- - Wer: 22.0273
25
 
26
  ## Model description
27
 
@@ -56,16 +54,16 @@ The following hyperparameters were used during training:
56
 
57
  | Training Loss | Epoch | Step | Validation Loss | Wer |
58
  |:-------------:|:------:|:----:|:---------------:|:-------:|
59
- | 1.9264 | 1.0 | 18 | 1.1710 | 43.2749 |
60
- | 0.7775 | 2.0 | 36 | 0.5345 | 31.3840 |
61
- | 0.3526 | 3.0 | 54 | 0.4953 | 50.0975 |
62
- | 0.1628 | 4.0 | 72 | 0.4611 | 25.1462 |
63
- | 0.0932 | 5.0 | 90 | 0.4517 | 22.2222 |
64
- | 0.0559 | 6.0 | 108 | 0.4196 | 21.0526 |
65
- | 0.0359 | 7.0 | 126 | 0.4440 | 22.4172 |
66
- | 0.0224 | 8.0 | 144 | 0.4335 | 23.1969 |
67
- | 0.0175 | 9.0 | 162 | 0.4301 | 21.8324 |
68
- | 0.0051 | 9.4507 | 170 | 0.4287 | 22.0273 |
69
 
70
 
71
  ### Framework versions
 
1
  ---
2
  library_name: transformers
 
 
3
  license: apache-2.0
4
+ base_model: rasel35/whisper-base-es-medical-terms
5
  tags:
6
  - generated_from_trainer
7
  metrics:
8
  - wer
9
  model-index:
10
+ - name: whisper-tiny-300-audios
11
  results: []
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
  should probably proofread and complete it, then remove this comment. -->
16
 
17
+ # whisper-tiny-300-audios
18
 
19
+ This model is a fine-tuned version of [rasel35/whisper-base-es-medical-terms](https://huggingface.co/rasel35/whisper-base-es-medical-terms) on an unspecified dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.4543
22
+ - Wer: 19.9630
23
 
24
  ## Model description
25
 
 
54
 
55
  | Training Loss | Epoch | Step | Validation Loss | Wer |
56
  |:-------------:|:------:|:----:|:---------------:|:-------:|
57
+ | 1.8385 | 1.0 | 18 | 1.1087 | 37.7079 |
58
+ | 0.6509 | 2.0 | 36 | 0.5255 | 25.1386 |
59
+ | 0.2616 | 3.0 | 54 | 0.4827 | 21.2569 |
60
+ | 0.1177 | 4.0 | 72 | 0.4747 | 21.0721 |
61
+ | 0.0719 | 5.0 | 90 | 0.4630 | 20.8872 |
62
+ | 0.0391 | 6.0 | 108 | 0.4802 | 21.8115 |
63
+ | 0.0313 | 7.0 | 126 | 0.4613 | 20.7024 |
64
+ | 0.023 | 8.0 | 144 | 0.4557 | 17.7449 |
65
+ | 0.0104 | 9.0 | 162 | 0.4513 | 20.1479 |
66
+ | 0.0042 | 9.4507 | 170 | 0.4543 | 19.9630 |
67
 
68
 
69
  ### Framework versions
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "stinoco/whisper-tiny-clinical-assistance",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
@@ -10,19 +10,32 @@
10
  "begin_suppress_tokens": null,
11
  "bos_token_id": 50257,
12
  "classifier_proj_size": 256,
13
- "d_model": 384,
14
- "decoder_attention_heads": 6,
15
- "decoder_ffn_dim": 1536,
16
  "decoder_layerdrop": 0.0,
17
- "decoder_layers": 4,
18
  "decoder_start_token_id": 50258,
19
  "dropout": 0.0,
20
- "encoder_attention_heads": 6,
21
- "encoder_ffn_dim": 1536,
22
  "encoder_layerdrop": 0.0,
23
- "encoder_layers": 4,
24
  "eos_token_id": 50257,
25
- "forced_decoder_ids": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  "init_std": 0.02,
27
  "is_encoder_decoder": true,
28
  "mask_feature_length": 10,
@@ -36,7 +49,7 @@
36
  "max_target_positions": 448,
37
  "median_filter_width": 7,
38
  "model_type": "whisper",
39
- "num_hidden_layers": 4,
40
  "num_mel_bins": 80,
41
  "pad_token_id": 50257,
42
  "scale_embedding": false,
 
1
  {
2
+ "_name_or_path": "rasel35/whisper-base-es-medical-terms",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
10
  "begin_suppress_tokens": null,
11
  "bos_token_id": 50257,
12
  "classifier_proj_size": 256,
13
+ "d_model": 512,
14
+ "decoder_attention_heads": 8,
15
+ "decoder_ffn_dim": 2048,
16
  "decoder_layerdrop": 0.0,
17
+ "decoder_layers": 6,
18
  "decoder_start_token_id": 50258,
19
  "dropout": 0.0,
20
+ "encoder_attention_heads": 8,
21
+ "encoder_ffn_dim": 2048,
22
  "encoder_layerdrop": 0.0,
23
+ "encoder_layers": 6,
24
  "eos_token_id": 50257,
25
+ "forced_decoder_ids": [
26
+ [
27
+ 1,
28
+ 50259
29
+ ],
30
+ [
31
+ 2,
32
+ 50359
33
+ ],
34
+ [
35
+ 3,
36
+ 50363
37
+ ]
38
+ ],
39
  "init_std": 0.02,
40
  "is_encoder_decoder": true,
41
  "mask_feature_length": 10,
 
49
  "max_target_positions": 448,
50
  "median_filter_width": 7,
51
  "model_type": "whisper",
52
+ "num_hidden_layers": 6,
53
  "num_mel_bins": 80,
54
  "pad_token_id": 50257,
55
  "scale_embedding": false,
generation_config.json CHANGED
@@ -1,28 +1,36 @@
1
  {
2
  "alignment_heads": [
3
- [
4
- 2,
5
- 2
6
- ],
7
  [
8
  3,
9
- 0
10
  ],
11
  [
12
- 3,
13
  2
14
  ],
15
  [
16
- 3,
17
  3
18
  ],
19
  [
20
- 3,
 
 
 
 
 
 
 
 
 
 
 
 
21
  4
22
  ],
23
  [
24
- 3,
25
- 5
26
  ]
27
  ],
28
  "begin_suppress_tokens": [
@@ -141,7 +149,96 @@
141
  "pad_token_id": 50257,
142
  "prev_sot_token_id": 50361,
143
  "return_timestamps": false,
144
- "suppress_tokens": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
145
  "task": "transcribe",
146
  "task_to_id": {
147
  "transcribe": 50359,
 
1
  {
2
  "alignment_heads": [
 
 
 
 
3
  [
4
  3,
5
+ 1
6
  ],
7
  [
8
+ 4,
9
  2
10
  ],
11
  [
12
+ 4,
13
  3
14
  ],
15
  [
16
+ 4,
17
+ 7
18
+ ],
19
+ [
20
+ 5,
21
+ 1
22
+ ],
23
+ [
24
+ 5,
25
+ 2
26
+ ],
27
+ [
28
+ 5,
29
  4
30
  ],
31
  [
32
+ 5,
33
+ 6
34
  ]
35
  ],
36
  "begin_suppress_tokens": [
 
149
  "pad_token_id": 50257,
150
  "prev_sot_token_id": 50361,
151
  "return_timestamps": false,
152
+ "suppress_tokens": [
153
+ 1,
154
+ 2,
155
+ 7,
156
+ 8,
157
+ 9,
158
+ 10,
159
+ 14,
160
+ 25,
161
+ 26,
162
+ 27,
163
+ 28,
164
+ 29,
165
+ 31,
166
+ 58,
167
+ 59,
168
+ 60,
169
+ 61,
170
+ 62,
171
+ 63,
172
+ 90,
173
+ 91,
174
+ 92,
175
+ 93,
176
+ 359,
177
+ 503,
178
+ 522,
179
+ 542,
180
+ 873,
181
+ 893,
182
+ 902,
183
+ 918,
184
+ 922,
185
+ 931,
186
+ 1350,
187
+ 1853,
188
+ 1982,
189
+ 2460,
190
+ 2627,
191
+ 3246,
192
+ 3253,
193
+ 3268,
194
+ 3536,
195
+ 3846,
196
+ 3961,
197
+ 4183,
198
+ 4667,
199
+ 6585,
200
+ 6647,
201
+ 7273,
202
+ 9061,
203
+ 9383,
204
+ 10428,
205
+ 10929,
206
+ 11938,
207
+ 12033,
208
+ 12331,
209
+ 12562,
210
+ 13793,
211
+ 14157,
212
+ 14635,
213
+ 15265,
214
+ 15618,
215
+ 16553,
216
+ 16604,
217
+ 18362,
218
+ 18956,
219
+ 20075,
220
+ 21675,
221
+ 22520,
222
+ 26130,
223
+ 26161,
224
+ 26435,
225
+ 28279,
226
+ 29464,
227
+ 31650,
228
+ 32302,
229
+ 32470,
230
+ 36865,
231
+ 42863,
232
+ 47425,
233
+ 49870,
234
+ 50254,
235
+ 50258,
236
+ 50358,
237
+ 50359,
238
+ 50360,
239
+ 50361,
240
+ 50362
241
+ ],
242
  "task": "transcribe",
243
  "task_to_id": {
244
  "transcribe": 50359,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c069ec4c9e1f73237fab3c012fac58422bc3544d4dd35f9894e82b031e41bc4a
3
- size 151061672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bffab982321fa722ac591f630f527a6a70ac8b338c4d5b533ce0c2d7a74f2ea
3
+ size 290403936
runs/Feb07_15-54-37_pop-os/events.out.tfevents.1738954868.pop-os.74078.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de5b1302eaea13a303417390b36d04f4df2cbb8b067312e16b6cadb72107c13
3
+ size 11535
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af780fe109268d0b43e272f2f2b7fda36a030d60e9816ab3e124c07a73043f6a
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a70c67b6d91835a8367fcd0fe2a9da3bcc8bdf85d21437245380641deaabf86a
3
  size 5496