File size: 10,788 Bytes
2267fac
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
#!/usr/bin/python3
# -*- coding: utf-8 -*-


# Example rows, one per sample recording.  Every row is a 6-item list:
#   [language, model, "greedy_search", 4, "Yes" or "No", path to audio file]
# Items three and four are identical for every row, so the comprehension
# below fills them in once and the table only lists the fields that vary.
# NOTE(review): "greedy_search", 4 and the "Yes"/"No" flag presumably map to
# the decoding method, the number of active paths and a punctuation toggle in
# the code that consumes this list -- confirm against the caller, which is
# not visible in this file.
examples = [
    [language, model, "greedy_search", 4, flag, wav]
    for language, model, flag, wav in (
        (
            "Chinese+English",
            "csukuangfj/sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20",
            "Yes",
            "./data/test_wavs/tal_csasr/0.wav",
        ),
        (
            "Chinese+English+Cantonese",
            "csukuangfj/sherpa-onnx-paraformer-trilingual-zh-cantonese-en",
            "Yes",
            "./data/test_wavs/cantonese/2.wav",
        ),
        (
            "Cantonese",
            "zrjin/icefall-asr-mdcc-zipformer-2024-03-11",
            "Yes",
            "./data/test_wavs/cantonese/1.wav",
        ),
        (
            "English",
            "whisper-base.en",
            "Yes",
            "./data/test_wavs/librispeech/1089-134686-0001.wav",
        ),
        (
            "Chinese",
            "csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09",
            "Yes",
            "./data/test_wavs/paraformer-zh/四川话.wav",
        ),
        (
            "Russian",
            "alphacep/vosk-model-ru",
            "No",
            "./data/test_wavs/russian/russian-i-love-you.wav",
        ),
        (
            "Russian",
            "alphacep/vosk-model-ru",
            "No",
            "./data/test_wavs/russian/test.wav",
        ),
        (
            "German",
            "csukuangfj/wav2vec2.0-torchaudio",
            "No",
            "./data/test_wavs/german/20170517-0900-PLENARY-16-de_20170517.wav",
        ),
        (
            "Arabic",
            "AmirHussein/icefall-asr-mgb2-conformer_ctc-2022-27-06",
            "No",
            "./data/test_wavs/arabic/a.wav",
        ),
        (
            "Tibetan",
            "syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
            "No",
            "./data/test_wavs/tibetan/a_0_cacm-A70_31117.wav",
        ),
        (
            "French",
            "shaojieli/sherpa-onnx-streaming-zipformer-fr-2023-04-14",
            "No",
            "./data/test_wavs/french/common_voice_fr_19364697.wav",
        ),
        (
            "Chinese",
            "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7",
            "Yes",
            "./data/test_wavs/alimeeting/R8003_M8001-8004-165.wav",
        ),
        (
            "Chinese",
            "csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09",
            "Yes",
            "./data/test_wavs/paraformer-zh/天津话.wav",
        ),
        (
            "Chinese",
            "csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09",
            "Yes",
            "./data/test_wavs/paraformer-zh/郑州话.wav",
        ),
        (
            "Chinese",
            "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7",
            "Yes",
            "./data/test_wavs/alimeeting/R8008_M8013-8049-74.wav",
        ),
        (
            "Chinese",
            "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7",
            "Yes",
            "./data/test_wavs/alimeeting/R8009_M8020_N_SPK8026-8026-209.wav",
        ),
        (
            "English",
            "videodanchik/icefall-asr-tedlium3-conformer-ctc2",
            "Yes",
            "./data/test_wavs/tedlium3/DanBarber_2010-219.wav",
        ),
        (
            "English",
            "whisper-base.en",
            "Yes",
            "./data/test_wavs/tedlium3/DanielKahneman_2010-157.wav",
        ),
        (
            "English",
            "videodanchik/icefall-asr-tedlium3-conformer-ctc2",
            "Yes",
            "./data/test_wavs/tedlium3/RobertGupta_2010U-15.wav",
        ),
        # librispeech
        # NOTE(review): the URL names a "stateless5" repository while the rows
        # below use the "stateless3" model -- confirm which one is intended.
        # https://huggingface.co/csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless5-2022-05-13/tree/main/data/test_wavs
        (
            "English",
            "csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13",
            "Yes",
            "./data/test_wavs/librispeech/1089-134686-0001.wav",
        ),
        (
            "English",
            "csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13",
            "Yes",
            "./data/test_wavs/librispeech/1221-135766-0001.wav",
        ),
        (
            "English",
            "csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13",
            "Yes",
            "./data/test_wavs/librispeech/1221-135766-0002.wav",
        ),
        # gigaspeech
        (
            "English",
            "wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2",
            "Yes",
            "./data/test_wavs/gigaspeech/1-minute-audiobook.opus",
        ),
        (
            "English",
            "wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2",
            "Yes",
            "./data/test_wavs/gigaspeech/100-seconds-podcast.opus",
        ),
        (
            "English",
            "wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2",
            "Yes",
            "./data/test_wavs/gigaspeech/100-seconds-youtube.opus",
        ),
        # wenetspeech
        # https://huggingface.co/luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2/tree/main/data/test_wavs
        (
            "Chinese",
            "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
            "Yes",
            "./data/test_wavs/wenetspeech/DEV_T0000000000.opus",
        ),
        (
            "Chinese",
            "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
            "Yes",
            "./data/test_wavs/wenetspeech/DEV_T0000000001.opus",
        ),
        (
            "Chinese",
            "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
            "Yes",
            "./data/test_wavs/wenetspeech/DEV_T0000000002.opus",
        ),
        # aishell2-A
        # https://huggingface.co/yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12/tree/main/data/test_wavs
        (
            "Chinese",
            "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12",
            "Yes",
            "./data/test_wavs/aishell2/ID0012W0030.wav",
        ),
        (
            "Chinese",
            "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12",
            "Yes",
            "./data/test_wavs/aishell2/ID0012W0162.wav",
        ),
        (
            "Chinese",
            "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12",
            "Yes",
            "./data/test_wavs/aishell2/ID0012W0215.wav",
        ),
        # aishell2-B (uses the same three wav paths as the aishell2-A rows
        # above; the URL below points at the "-A" repository)
        # https://huggingface.co/yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12/tree/main/data/test_wavs
        (
            "Chinese",
            "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12",
            "Yes",
            "./data/test_wavs/aishell2/ID0012W0030.wav",
        ),
        (
            "Chinese",
            "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12",
            "Yes",
            "./data/test_wavs/aishell2/ID0012W0162.wav",
        ),
        (
            "Chinese",
            "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12",
            "Yes",
            "./data/test_wavs/aishell2/ID0012W0215.wav",
        ),
        # aidatatang_200zh
        # https://huggingface.co/luomingshuang/icefall_asr_aidatatang-200zh_pruned_transducer_stateless2/tree/main/data/test_wavs
        (
            "Chinese",
            "luomingshuang/icefall_asr_aidatatang-200zh_pruned_transducer_stateless2",
            "Yes",
            "./data/test_wavs/aidatatang_200zh/T0055G0036S0002.wav",
        ),
        (
            "Chinese",
            "luomingshuang/icefall_asr_aidatatang-200zh_pruned_transducer_stateless2",
            "Yes",
            "./data/test_wavs/aidatatang_200zh/T0055G0036S0003.wav",
        ),
        (
            "Chinese",
            "luomingshuang/icefall_asr_aidatatang-200zh_pruned_transducer_stateless2",
            "Yes",
            "./data/test_wavs/aidatatang_200zh/T0055G0036S0004.wav",
        ),
        # tal_csasr
        (
            "Chinese+English",
            "ptrnull/icefall-asr-conv-emformer-transducer-stateless2-zh",
            "Yes",
            "./data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_132.wav",
        ),
        (
            "Chinese+English",
            "ptrnull/icefall-asr-conv-emformer-transducer-stateless2-zh",
            "Yes",
            "./data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_138.wav",
        ),
        (
            "Chinese+English",
            "ptrnull/icefall-asr-conv-emformer-transducer-stateless2-zh",
            "Yes",
            "./data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_145.wav",
        ),
        # tibetan
        (
            "Tibetan",
            "syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
            "No",
            "./data/test_wavs/tibetan/a_0_cacm-A70_31116.wav",
        ),
        (
            "Tibetan",
            "syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
            "No",
            "./data/test_wavs/tibetan/a_0_cacm-A70_31118.wav",
        ),
        # arabic
        (
            "Arabic",
            "AmirHussein/icefall-asr-mgb2-conformer_ctc-2022-27-06",
            "No",
            "./data/test_wavs/arabic/b.wav",
        ),
        (
            "Arabic",
            "AmirHussein/icefall-asr-mgb2-conformer_ctc-2022-27-06",
            "No",
            "./data/test_wavs/arabic/c.wav",
        ),
        # german
        (
            "German",
            "csukuangfj/wav2vec2.0-torchaudio",
            "No",
            "./data/test_wavs/german/20120315-0900-PLENARY-14-de_20120315.wav",
        ),
        # french
        (
            "French",
            "shaojieli/sherpa-onnx-streaming-zipformer-fr-2023-04-14",
            "No",
            "./data/test_wavs/french/common_voice_fr_19738183.wav",
        ),
        (
            "French",
            "shaojieli/sherpa-onnx-streaming-zipformer-fr-2023-04-14",
            "No",
            "./data/test_wavs/french/common_voice_fr_27024649.wav",
        ),
    )
]