small lm added

Files changed (10) hide show

README.md CHANGED Viewed

@@ -24,7 +24,21 @@ model-index:
       value: 9.480663281840769
     - name: Test CER
       type: cer
-      value: 2.273015898213336
   - task:
       name: Automatic Speech Recognition
       type: automatic-speech-recognition
@@ -38,7 +52,21 @@ model-index:
       value: 8.122005951166668
     - name: Test CER
       type: cer
-      value: 1.8815347657065468
 ---
 # wav2vec2-large-xlsr-53-german-cv9

       value: 9.480663281840769
     - name: Test CER
       type: cer
+      value: 1.9167347943074394
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: Common Voice 9
+      type: mozilla-foundation/common_voice_9_0
+      args: de
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 7.49027762774117
+    - name: Test CER
+      type: cer
+      value: 1.9167347943074394
   - task:
       name: Automatic Speech Recognition
       type: automatic-speech-recognition
       value: 8.122005951166668
     - name: Test CER
       type: cer
+      value: 1.
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: Common Voice 6.1
+      type: common_voice
+      args: de
+    metrics:
+    - name: Test WER (+LM)
+      type: wer
+      value: 6.1453182045203544
+    - name: Test CER (+LM)
+      type: cer
+      value: 1.5247743373447677
 ---
 # wav2vec2-large-xlsr-53-german-cv9

added_tokens.json CHANGED Viewed

+{
+  "</s>": 34,
+  "<s>": 33
+}

alphabet.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"labels": [" ", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u00df", "\u00e4", "\u00f6", "\u00fc", "\u2047", "", "<s>", "</s>"], "is_bpe": false}

language_model/5gram.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:9282e9575d6f2b2853034f0695bd935c36b0262516578f9930c2c69a419a1146
+size 315428505

language_model/attrs.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"alpha": 0.5, "beta": 1.5, "unk_score_offset": -10.0, "score_boundary": true}

language_model/unigrams.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

preprocessor_config.json CHANGED Viewed

@@ -4,6 +4,7 @@
   "feature_size": 1,
   "padding_side": "right",
   "padding_value": 0,
   "return_attention_mask": true,
   "sampling_rate": 16000
 }

   "feature_size": 1,
   "padding_side": "right",
   "padding_value": 0,
+  "processor_class": "Wav2Vec2ProcessorWithLM",
   "return_attention_mask": true,
   "sampling_rate": 16000
 }

special_tokens_map.json CHANGED Viewed

	@@ -1 +1,36 @@
1	- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}

+{
+  "additional_special_tokens": [
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    }
+  ],
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "pad_token": "[PAD]",
+  "unk_token": "[UNK]"
+}

tokenizer_config.json CHANGED Viewed

	@@ -1 +1,13 @@
1	- {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "replace_word_delimiter_char": " ", "special_tokens_map_file": null, "name_or_path": "./wav2vec2-large-xlsr-53-german-cv9", "tokenizer_class": "Wav2Vec2CTCTokenizer"}

+{
+  "bos_token": "<s>",
+  "do_lower_case": false,
+  "eos_token": "</s>",
+  "name_or_path": "published/wav2vec2-large-xlsr-53-german-cv9",
+  "pad_token": "[PAD]",
+  "processor_class": "Wav2Vec2ProcessorWithLM",
+  "replace_word_delimiter_char": " ",
+  "special_tokens_map_file": null,
+  "tokenizer_class": "Wav2Vec2CTCTokenizer",
+  "unk_token": "[UNK]",
+  "word_delimiter_token": "|"
+}

vocab.json CHANGED Viewed

	@@ -1 +1,35 @@
1	- {"a": 1, "b": 2, "c": 3, "d": 4, "e": 5, "f": 6, "g": 7, "h": 8, "i": 9, "j": 10, "k": 11, "l": 12, "m": 13, "n": 14, "o": 15, "p": 16, "q": 17, "r": 18, "s": 19, "t": 20, "u": 21, "v": 22, "w": 23, "x": 24, "y": 25, "z": 26, "ß": 27, "ä": 28, "ö": 29, "ü": 30, "|": 0, "[UNK]": 31, "[PAD]": 32}

+{
+  "[PAD]": 32,
+  "[UNK]": 31,
+  "a": 1,
+  "b": 2,
+  "c": 3,
+  "d": 4,
+  "e": 5,
+  "f": 6,
+  "g": 7,
+  "h": 8,
+  "i": 9,
+  "j": 10,
+  "k": 11,
+  "l": 12,
+  "m": 13,
+  "n": 14,
+  "o": 15,
+  "p": 16,
+  "q": 17,
+  "r": 18,
+  "s": 19,
+  "t": 20,
+  "u": 21,
+  "v": 22,
+  "w": 23,
+  "x": 24,
+  "y": 25,
+  "z": 26,
+  "|": 0,
+  "ß": 27,
+  "ä": 28,
+  "ö": 29,
+  "ü": 30
+}