nbaden
/

wav2vec2-large-xlsr-53-demo-colab

@@ -5,24 +5,9 @@ tags:
 - generated_from_trainer
 datasets:
 - common_voice_13_0
-metrics:
-- wer
 model-index:
 - name: wav2vec2-large-xlsr-53-demo-colab
-  results:
-  - task:
-      name: Automatic Speech Recognition
-      type: automatic-speech-recognition
-    dataset:
-      name: common_voice_13_0
-      type: common_voice_13_0
-      config: sah
-      split: test
-      args: sah
-    metrics:
-    - name: Wer
-      type: wer
-      value: 0.5698038864511508
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -31,9 +16,6 @@ should probably proofread and complete it, then remove this comment. -->
 # wav2vec2-large-xlsr-53-demo-colab
 This model is a fine-tuned version of [facebook/wav2vec2-large-xlsr-53](https://huggingface.co/facebook/wav2vec2-large-xlsr-53) on the common_voice_13_0 dataset.
-It achieves the following results on the evaluation set:
-- Loss: 0.8836
-- Wer: 0.5698
 ## Model description
@@ -59,26 +41,17 @@ The following hyperparameters were used during training:
 - gradient_accumulation_steps: 2
 - total_train_batch_size: 32
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
-- lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
-- num_epochs: 100
 ### Training results
-| Training Loss | Epoch | Step | Validation Loss | Wer    |
-|:-------------:|:-----:|:----:|:---------------:|:------:|
-| 0.1354        | 14.04 | 400  | 0.8703          | 0.6377 |
-| 0.1297        | 28.07 | 800  | 0.8601          | 0.6317 |
-| 0.0937        | 42.11 | 1200 | 0.9103          | 0.6320 |
-| 0.0751        | 56.14 | 1600 | 0.8848          | 0.6044 |
-| 0.0582        | 70.18 | 2000 | 0.8630          | 0.5770 |
-| 0.0492        | 84.21 | 2400 | 0.8889          | 0.5786 |
-| 0.0402        | 98.25 | 2800 | 0.8836          | 0.5698 |
 ### Framework versions
 - Transformers 4.34.0
-- Pytorch 2.1.0+cu118
 - Datasets 2.14.5
 - Tokenizers 0.14.1

 - generated_from_trainer
 datasets:
 - common_voice_13_0
 model-index:
 - name: wav2vec2-large-xlsr-53-demo-colab
+  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You should probably proofread and complete it, then remove this comment. -->
 # wav2vec2-large-xlsr-53-demo-colab
 This model is a fine-tuned version of [facebook/wav2vec2-large-xlsr-53](https://huggingface.co/facebook/wav2vec2-large-xlsr-53) on the common_voice_13_0 dataset.
 ## Model description
 - gradient_accumulation_steps: 2
 - total_train_batch_size: 32
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: constant
 - lr_scheduler_warmup_steps: 500
+- num_epochs: 20
 ### Training results
 ### Framework versions
 - Transformers 4.34.0
+- PyTorch 2.1.0+cu121
 - Datasets 2.14.5
 - Tokenizers 0.14.1

config.json CHANGED Viewed

@@ -86,7 +86,7 @@
   "num_hidden_layers": 24,
   "num_negatives": 100,
   "output_hidden_size": 1024,
-  "pad_token_id": 47,
   "proj_codevector_dim": 768,
   "tdnn_dilation": [
     1,
@@ -112,6 +112,6 @@
   "torch_dtype": "float32",
   "transformers_version": "4.34.0",
   "use_weighted_layer_sum": false,
-  "vocab_size": 50,
   "xvector_output_dim": 512
 }

   "num_hidden_layers": 24,
   "num_negatives": 100,
   "output_hidden_size": 1024,
+  "pad_token_id": 45,
   "proj_codevector_dim": 768,
   "tdnn_dilation": [
     1,
   "torch_dtype": "float32",
   "transformers_version": "4.34.0",
   "use_weighted_layer_sum": false,
+  "vocab_size": 48,
   "xvector_output_dim": 512
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2df734d98ecc1e8217c474526d337df466d140427d59f0dfa38e3981b3185555
-size 1262107370

 version https://git-lfs.github.com/spec/v1
+oid sha256:d756ee3e6ae46dc85a03c2a5dad2800bfb999be7e826a7c1f1e7912bd7f58cd4
+size 1262099178

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e236b946192a413d9db31df9da6864d22bd3aa4faa3ffe39765deffd168ab7f8
 size 4536

 version https://git-lfs.github.com/spec/v1
+oid sha256:8661f961f72473d1da09bea5fcf6ef512fd600c704c4313ab14ca264cd4a6597
 size 4536