sabroo
/

w2v-bert-2.0-slovak-colab-CV17.0

@@ -1,19 +1,19 @@
 ---
 base_model: facebook/w2v-bert-2.0
 datasets:
 - common_voice_17_0
-library_name: transformers
-license: mit
 metrics:
 - wer
-tags:
-- generated_from_trainer
 model-index:
 - name: w2v-bert-2.0-slovak-colab-CV17.0
   results:
   - task:
-      type: automatic-speech-recognition
       name: Automatic Speech Recognition
     dataset:
       name: common_voice_17_0
       type: common_voice_17_0
@@ -21,9 +21,9 @@ model-index:
       split: test
       args: sk
     metrics:
-    - type: wer
-      value: 0.13279330117411486
-      name: Wer
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,8 +33,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [facebook/w2v-bert-2.0](https://huggingface.co/facebook/w2v-bert-2.0) on the common_voice_17_0 dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.3002
-- Wer: 0.1328
 ## Model description
@@ -62,19 +62,22 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
-- num_epochs: 10
 - mixed_precision_training: Native AMP
 ### Training results
-| Training Loss | Epoch  | Step | Validation Loss | Wer    |
-|:-------------:|:------:|:----:|:---------------:|:------:|
-| 2.3467        | 1.6393 | 300  | 0.3488          | 0.2605 |
-| 0.1905        | 3.2787 | 600  | 0.3339          | 0.2059 |
-| 0.1121        | 4.9180 | 900  | 0.3009          | 0.1849 |
-| 0.0592        | 6.5574 | 1200 | 0.2817          | 0.1482 |
-| 0.0264        | 8.1967 | 1500 | 0.3114          | 0.1385 |
-| 0.0094        | 9.8361 | 1800 | 0.3002          | 0.1328 |
 ### Framework versions

 ---
+library_name: transformers
+license: mit
 base_model: facebook/w2v-bert-2.0
+tags:
+- generated_from_trainer
 datasets:
 - common_voice_17_0
 metrics:
 - wer
 model-index:
 - name: w2v-bert-2.0-slovak-colab-CV17.0
   results:
   - task:
       name: Automatic Speech Recognition
+      type: automatic-speech-recognition
     dataset:
       name: common_voice_17_0
       type: common_voice_17_0
       split: test
       args: sk
     metrics:
+    - name: Wer
+      type: wer
+      value: 0.1358878674797488
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 This model is a fine-tuned version of [facebook/w2v-bert-2.0](https://huggingface.co/facebook/w2v-bert-2.0) on the common_voice_17_0 dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.3823
+- Wer: 0.1359
 ## Model description
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
+- num_epochs: 15
 - mixed_precision_training: Native AMP
 ### Training results
+| Training Loss | Epoch   | Step | Validation Loss | Wer    |
+|:-------------:|:-------:|:----:|:---------------:|:------:|
+| 3.1601        | 1.6393  | 300  | 0.4869          | 0.2985 |
+| 0.2141        | 3.2787  | 600  | 0.3886          | 0.2144 |
+| 0.1323        | 4.9180  | 900  | 0.3180          | 0.1840 |
+| 0.0754        | 6.5574  | 1200 | 0.3019          | 0.1750 |
+| 0.0401        | 8.1967  | 1500 | 0.3717          | 0.1525 |
+| 0.022         | 9.8361  | 1800 | 0.3408          | 0.1503 |
+| 0.0083        | 11.4754 | 2100 | 0.3489          | 0.1413 |
+| 0.0027        | 13.1148 | 2400 | 0.3681          | 0.1358 |
+| 0.0011        | 14.7541 | 2700 | 0.3823          | 0.1359 |
 ### Framework versions

config.json CHANGED Viewed

@@ -47,7 +47,7 @@
   "num_hidden_layers": 24,
   "num_negatives": 100,
   "output_hidden_size": 1024,
-  "pad_token_id": 48,
   "position_embeddings_type": "relative_key",
   "proj_codevector_dim": 768,
   "right_max_position_embeddings": 8,
@@ -77,6 +77,6 @@
   "transformers_version": "4.45.2",
   "use_intermediate_ffn_before_adapter": false,
   "use_weighted_layer_sum": false,
-  "vocab_size": 51,
   "xvector_output_dim": 512
 }

   "num_hidden_layers": 24,
   "num_negatives": 100,
   "output_hidden_size": 1024,
+  "pad_token_id": 46,
   "position_embeddings_type": "relative_key",
   "proj_codevector_dim": 768,
   "right_max_position_embeddings": 8,
   "transformers_version": "4.45.2",
   "use_intermediate_ffn_before_adapter": false,
   "use_weighted_layer_sum": false,
+  "vocab_size": 49,
   "xvector_output_dim": 512
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0c9d1233c731a7883e4476561b845923d14a363e3a8c618c322fe19d74080c27
-size 2423023660

 version https://git-lfs.github.com/spec/v1
+oid sha256:22c399b1ffb31d288ee510d0fb07f556f93c4ecf87c08a5ca0e51adb4e1ddb58
+size 2423015460

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c3e6a73a5edb73730efbca5e8e0e5afcbe1b71c17a1ad83d7a11896f11c034c
 size 5176

 version https://git-lfs.github.com/spec/v1
+oid sha256:67b8d9a2dbf6c2ef5db49f5f257ebcfd3b4bed49a85f5ebc1fa76e1332f3a022
 size 5176