nvidia
/

stt_zh_citrinet_1024_gamma_0_25

@@ -11,7 +11,6 @@ tags:
 - audio
 - CTC
 - Citrinet
-- Transformer
 - pytorch
 - NeMo
 - hf-asr-leaderboard
@@ -24,108 +23,32 @@ model-index:
       name: Automatic Speech Recognition
       type: automatic-speech-recognition
     dataset:
-      name: LibriSpeech (clean)
-      type: librispeech_asr
-      config: clean
-      split: test
-      args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 2.2
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: LibriSpeech (other)
-      type: librispeech_asr
-      config: other
-      split: test
-      args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 4.3
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: Multilingual LibriSpeech
-      type: facebook/multilingual_librispeech
-      config: english
-      split: test
-      args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 7.2
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: Mozilla Common Voice 7.0
-      type: mozilla-foundation/common_voice_7_0
-      config: en
-      split: test
       args:
-        language: en
     metrics:
-    - name: Test WER
-      type: wer
-      value: 8.0
   - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
     dataset:
-      name: Mozilla Common Voice 8.0
-      type: mozilla-foundation/common_voice_8_0
-      config: en
       split: test
       args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 9.48
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: Wall Street Journal 92
-      type: wsj_0
-      args:
-        language: en
     metrics:
-    - name: Test WER
-      type: wer
-      value: 2.0
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: Wall Street Journal 93
-      type: wsj_1
-      args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 2.9
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: National Singapore Corpus
-      type: nsc_part_1
-      args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 7.0
 ---
 # NVIDIA Streaming Citrinet 1024 (zh)

 - audio
 - CTC
 - Citrinet
 - pytorch
 - NeMo
 - hf-asr-leaderboard
       name: Automatic Speech Recognition
       type: automatic-speech-recognition
     dataset:
+      name: Dev iOS
+      type: aishell_2
+      config: iOS
+      split: dev
       args:
+        language: zh
     metrics:
+    - name: Dev CER
+      type: cer
+      value: 4.8
   - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
     dataset:
+      name: Test iOS
+      type: aishell_2
+      config: iOS
       split: test
       args:
+        language: zh
     metrics:
+    - name: Test CER
+      type: cer
+      value: 5.1
 ---
 # NVIDIA Streaming Citrinet 1024 (zh)