nvidia
/

stt_en_conformer_ctc_large

@@ -1,5 +1,6 @@
 ---
-language: "en"
 library_name: nemo
 datasets:
 - librispeech_asr
@@ -14,7 +15,7 @@ datasets:
 - Europarl-ASR (EN)
 - Multilingual LibriSpeech (2000 hours)
 - mozilla-foundation/common_voice_7_0
-thumbnail:
 tags:
 - automatic-speech-recognition
 - speech
@@ -32,96 +33,114 @@ widget:
 - example_title: Librispeech sample 2
   src: https://cdn-media.huggingface.co/speech_samples/sample2.flac
 model-index:
-  - name: stt_en_conformer_ctc_large
-    results:
-    - task:
-        type: Automatic Speech Recognition
-        name: automatic-speech-recognition
-      dataset:
-        name: Librispeech (clean)
-        type: librispeech_asr
-        args: en
-      metrics:
-        - name: Test WER
-          type: wer
-          value: 2.2
-    - task:
-        type: Automatic Speech Recognition
-        name: automatic-speech-recognition
-      dataset:
-        name: Librispeech (other)
-        type: librispeech_asr
-        args: en
-      metrics:
-        - name: Test WER
-          type: wer
-          value: 4.3
-    - task:
-        type: Automatic Speech Recognition
-        name: automatic-speech-recognition
-      dataset:
-        name: Multilingual LibriSpeech
-        type: mls
-        args: en
-      metrics:
-        - name: Test WER
-          type: wer
-          value: 7.2
-    - task:
-        type: Automatic Speech Recognition
-        name: automatic-speech-recognition
-      dataset:
-        name: Mozilla Common Voice 7.0
-        type: mozilla-foundation/common_voice_7_0
-        args: en
-      metrics:
-        - name: Test WER
-          type: wer
-          value: 8.0
-    - task:
-        type: Automatic Speech Recognition
-        name: automatic-speech-recognition
-      dataset:
-        name: Mozilla Common Voice 8.0
-        type: mozilla-foundation/common_voice_8_0
-        args: en
-      metrics:
-        - name: Test WER
-          type: wer
-          value: 9.48
-    - task:
-        type: Automatic Speech Recognition
-        name: automatic-speech-recognition
-      dataset:
-        name: Wall Street Journal 92
-        type: wsj_0
-        args: en
-      metrics:
-        - name: Test WER
-          type: wer
-          value: 2.0
-    - task:
-        type: Automatic Speech Recognition
-        name: automatic-speech-recognition
-      dataset:
-        name: Wall Street Journal 93
-        type: wsj_1
-        args: en
-      metrics:
-        - name: Test WER
-          type: wer
-          value: 2.9
-    - task:
-        type: Automatic Speech Recognition
-        name: automatic-speech-recognition
-      dataset:
-        name: National Singapore Corpus
-        type: nsc_part_1
-        args: en
-      metrics:
-        - name: Test WER
-          type: wer
-          value: 7.0
 ---
 ## Model Overview

 ---
+language:
+- en
 library_name: nemo
 datasets:
 - librispeech_asr
 - Europarl-ASR (EN)
 - Multilingual LibriSpeech (2000 hours)
 - mozilla-foundation/common_voice_7_0
+thumbnail: null
 tags:
 - automatic-speech-recognition
 - speech
 - example_title: Librispeech sample 2
   src: https://cdn-media.huggingface.co/speech_samples/sample2.flac
 model-index:
+- name: stt_en_conformer_ctc_large
+  results:
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: LibriSpeech (clean)
+      type: librispeech_asr
+      config: clean
+      split: test
+      args:
+        language: en
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 2.2
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: LibriSpeech (other)
+      type: librispeech_asr
+      config: other
+      split: test
+      args:
+        language: en
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 4.3
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: Multilingual LibriSpeech
+      type: facebook/multilingual_librispeech
+      config: english
+      split: test
+      args:
+        language: en
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 7.2
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: Mozilla Common Voice 7.0
+      type: mozilla-foundation/common_voice_7_0
+      config: en
+      split: test
+      args:
+        language: en
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 8.0
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: Mozilla Common Voice 8.0
+      type: mozilla-foundation/common_voice_8_0
+      config: en
+      split: test
+      args:
+        language: en
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 9.48
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: Wall Street Journal 92
+      type: wsj_0
+      args:
+        language: en
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 2.0
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: Wall Street Journal 93
+      type: wsj_1
+      args:
+        language: en
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 2.9
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: National Singapore Corpus
+      type: nsc_part_1
+      args:
+        language: en
+    metrics:
+    - name: Test WER
+      type: wer
+      value: 7.0
 ---
 ## Model Overview