File size: 1,372 Bytes
afcf2d9
fe12949
c25fd87
 
fe12949
65cc2e6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
fe12949
 
65cc2e6
 
 
 
 
 
 
 
 
 
 
 
fe12949
 
65cc2e6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
afcf2d9
65cc2e6
c25fd87
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
---
# Model-card metadata (YAML front matter of the README).

# Languages declared for this model.
language:
- pt
- en
- es
tags:
- audio
- automatic-speech-recognition
- hf-asr-leaderboard
# Example audio clips listed for the model page widget.
widget:
- example_title: Librispeech sample 1
  src: https://cdn-media.huggingface.co/speech_samples/sample1.flac
- example_title: Librispeech sample 2
  src: https://cdn-media.huggingface.co/speech_samples/sample2.flac
# Reported evaluation results, one entry per (dataset, config, split).
# NOTE(review): the entry is named `whisper-medium` while the README heading
# reads "STT - V0 Base" -- confirm these numbers were measured on this model.
model-index:
- name: whisper-medium
  results:
  - task:
      name: Automatic Speech Recognition
      type: automatic-speech-recognition
    dataset:
      name: LibriSpeech (clean)
      type: librispeech_asr
      config: clean
      split: test
      args:
        # LibriSpeech is an English corpus, so the evaluation language is `en`.
        language: en
    metrics:
    - name: Test WER
      type: wer
      value: 2.9
  - task:
      name: Automatic Speech Recognition
      type: automatic-speech-recognition
    dataset:
      name: LibriSpeech (other)
      type: librispeech_asr
      config: other
      split: test
      args:
        # LibriSpeech is an English corpus, so the evaluation language is `en`.
        language: en
    metrics:
    - name: Test WER
      type: wer
      value: 5.9
  - task:
      name: Automatic Speech Recognition
      type: automatic-speech-recognition
    dataset:
      name: Common Voice 11.0
      type: mozilla-foundation/common_voice_11_0
      config: hi
      split: test
      args:
        # NOTE(review): `hi` is not in the top-level `language` list above --
        # confirm whether it should be added there or this entry removed.
        language: hi
    metrics:
    - name: Test WER
      type: wer
      value: 53.87
pipeline_tag: automatic-speech-recognition
license: apache-2.0
---

# STT - V0 Base