root committed on
Commit
c8fc790
1 Parent(s): a23e2a2

Update model

Browse files
Files changed (20) hide show
  1. .gitattributes +1 -0
  2. README.md +740 -0
  3. meta.yaml +8 -0
  4. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/config.yaml +667 -0
  5. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/acc_m.png +0 -0
  6. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/acc_u.png +0 -0
  7. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/backward_time.png +0 -0
  8. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/correct_m.png +0 -0
  9. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/correct_u.png +0 -0
  10. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/count_m.png +0 -0
  11. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/count_u.png +0 -0
  12. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/forward_time.png +0 -0
  13. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/gpu_max_cached_mem_GB.png +0 -0
  14. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/iter_time.png +0 -0
  15. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/loss.png +0 -0
  16. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/optim0_lr0.png +0 -0
  17. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/optim_step_time.png +0 -0
  18. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/train_time.png +0 -0
  19. mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/valid.loss.ave_10best.pth +3 -0
  20. mnt/datastore/exp/kmeans_iter1_hubert_train_960_portion0.1_gigaspeech/km_500.mdl +3 -0
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ *.mdl filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,740 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - espnet
4
+ - audio
5
+ - self-supervised-learning
6
+ language: en
7
+ datasets:
8
+ - librispeech
9
+ license: cc-by-4.0
10
+ ---
11
+
12
+ ## ESPnet2 SSL model
13
+
14
+ ### `espnet/hubert_large_gs_16_librilight60k`
15
+
16
+ This model was trained by wanchichen using the librispeech recipe in [espnet](https://github.com/espnet/espnet/).
17
+
18
+ ### Demo: How to use in ESPnet2
19
+
20
+ Follow the [ESPnet installation instructions](https://espnet.github.io/espnet/installation.html)
21
+ if you haven't done that already.
22
+
23
+ ```bash
24
+ cd espnet
25
+
26
+ pip install -e .
27
+ cd egs2/librispeech/ssl1
28
+ ./run.sh --skip_data_prep false --skip_train true --download_model espnet/hubert_large_gs_16_librilight60k
29
+ ```
30
+
31
+
32
+
33
+ ## SSL config
34
+
35
+ <details><summary>expand</summary>
36
+
37
+ ```
38
+ config: conf/tuning/train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins.yaml
39
+ print_config: false
40
+ log_level: INFO
41
+ dry_run: false
42
+ iterator_type: sequence
43
+ output_dir: exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw
44
+ ngpu: 1
45
+ seed: 0
46
+ num_workers: 16
47
+ num_att_plot: 3
48
+ dist_backend: nccl
49
+ dist_init_method: env://
50
+ dist_world_size: 8
51
+ dist_rank: 0
52
+ local_rank: 0
53
+ dist_master_addr: localhost
54
+ dist_master_port: 55415
55
+ dist_launcher: null
56
+ multiprocessing_distributed: true
57
+ unused_parameters: true
58
+ sharded_ddp: false
59
+ cudnn_enabled: true
60
+ cudnn_benchmark: false
61
+ cudnn_deterministic: true
62
+ collect_stats: false
63
+ write_collected_feats: false
64
+ max_epoch: 190
65
+ patience: null
66
+ val_scheduler_criterion:
67
+ - valid
68
+ - loss
69
+ early_stopping_criterion:
70
+ - valid
71
+ - loss
72
+ - min
73
+ best_model_criterion:
74
+ - - valid
75
+ - loss
76
+ - min
77
+ keep_nbest_models: 10
78
+ nbest_averaging_interval: 0
79
+ grad_clip: 5.0
80
+ grad_clip_type: 2.0
81
+ grad_noise: false
82
+ accum_grad: 16
83
+ no_forward_run: false
84
+ resume: true
85
+ train_dtype: float32
86
+ use_amp: true
87
+ log_interval: null
88
+ use_matplotlib: true
89
+ use_tensorboard: true
90
+ create_graph_in_tensorboard: false
91
+ use_wandb: false
92
+ wandb_project: null
93
+ wandb_id: null
94
+ wandb_entity: null
95
+ wandb_name: null
96
+ wandb_model_log_interval: -1
97
+ detect_anomaly: false
98
+ pretrain_path: null
99
+ init_param: []
100
+ ignore_init_mismatch: false
101
+ freeze_param: []
102
+ num_iters_per_epoch: 40000
103
+ batch_size: 20
104
+ valid_batch_size: null
105
+ batch_bins: 100000
106
+ valid_batch_bins: null
107
+ train_shape_file:
108
+ - exp/hubert_iter1_stats_raw/splits16/speech_shape
109
+ - exp/hubert_iter1_stats_raw/splits16/text_shape.word
110
+ valid_shape_file:
111
+ - exp/hubert_iter1_stats_raw/valid/speech_shape
112
+ - exp/hubert_iter1_stats_raw/valid/text_shape.word
113
+ batch_type: numel
114
+ valid_batch_type: null
115
+ fold_length:
116
+ - 80000
117
+ - 400
118
+ sort_in_batch: descending
119
+ sort_batch: descending
120
+ multiple_iterator: true
121
+ chunk_length: 500
122
+ chunk_shift_ratio: 0.5
123
+ num_cache_chunks: 1024
124
+ train_data_path_and_name_and_type:
125
+ - - exp/hubert_iter1_stats_raw/splits16/wav.scp
126
+ - speech
127
+ - sound
128
+ - - exp/hubert_iter1_stats_raw/splits16/text.km.kmeans_iter1_hubert_train_60k_portion0.1_gigaspeech
129
+ - text
130
+ - text
131
+ valid_data_path_and_name_and_type:
132
+ - - dump/raw/dev/wav.scp
133
+ - speech
134
+ - sound
135
+ - - dump/raw/dev/text.km.kmeans_iter1_hubert_train_60k_portion0.1_gigaspeech
136
+ - text
137
+ - text
138
+ allow_variable_data_keys: false
139
+ max_cache_size: 0.0
140
+ max_cache_fd: 32
141
+ valid_max_cache_size: null
142
+ exclude_weight_decay: false
143
+ exclude_weight_decay_conf: {}
144
+ optim: adam
145
+ optim_conf:
146
+ lr: 0.0005
147
+ scheduler: warmuplr
148
+ scheduler_conf:
149
+ warmup_steps: 32000
150
+ token_list:
151
+ - '6'
152
+ - '185'
153
+ - '233'
154
+ - '206'
155
+ - '200'
156
+ - '47'
157
+ - '129'
158
+ - '362'
159
+ - '436'
160
+ - '50'
161
+ - '30'
162
+ - '137'
163
+ - '39'
164
+ - '126'
165
+ - '81'
166
+ - '78'
167
+ - '444'
168
+ - '439'
169
+ - '230'
170
+ - '33'
171
+ - '14'
172
+ - '61'
173
+ - '450'
174
+ - '239'
175
+ - '293'
176
+ - '161'
177
+ - '410'
178
+ - '355'
179
+ - '262'
180
+ - '475'
181
+ - '338'
182
+ - '201'
183
+ - '242'
184
+ - '318'
185
+ - '159'
186
+ - '56'
187
+ - '190'
188
+ - '21'
189
+ - '259'
190
+ - '458'
191
+ - '187'
192
+ - '268'
193
+ - '7'
194
+ - '398'
195
+ - '67'
196
+ - '11'
197
+ - '455'
198
+ - '241'
199
+ - '4'
200
+ - '261'
201
+ - '412'
202
+ - '388'
203
+ - '402'
204
+ - '414'
205
+ - '180'
206
+ - '41'
207
+ - '198'
208
+ - '100'
209
+ - '459'
210
+ - '96'
211
+ - '235'
212
+ - '267'
213
+ - '203'
214
+ - '189'
215
+ - '60'
216
+ - '160'
217
+ - '64'
218
+ - '300'
219
+ - '295'
220
+ - '473'
221
+ - '37'
222
+ - '130'
223
+ - '77'
224
+ - '424'
225
+ - '369'
226
+ - '217'
227
+ - '366'
228
+ - '3'
229
+ - '82'
230
+ - '149'
231
+ - '330'
232
+ - '79'
233
+ - '351'
234
+ - '223'
235
+ - '446'
236
+ - '269'
237
+ - '148'
238
+ - '186'
239
+ - '110'
240
+ - '62'
241
+ - '471'
242
+ - '316'
243
+ - '433'
244
+ - '127'
245
+ - '354'
246
+ - '243'
247
+ - '457'
248
+ - '240'
249
+ - '375'
250
+ - '46'
251
+ - '40'
252
+ - '339'
253
+ - '224'
254
+ - '183'
255
+ - '179'
256
+ - '357'
257
+ - '430'
258
+ - '83'
259
+ - '49'
260
+ - '154'
261
+ - '237'
262
+ - '460'
263
+ - '353'
264
+ - '289'
265
+ - '92'
266
+ - '109'
267
+ - '311'
268
+ - '71'
269
+ - '391'
270
+ - '406'
271
+ - '43'
272
+ - '73'
273
+ - '418'
274
+ - '437'
275
+ - '250'
276
+ - '463'
277
+ - '120'
278
+ - '346'
279
+ - '146'
280
+ - '454'
281
+ - '211'
282
+ - '274'
283
+ - '167'
284
+ - '345'
285
+ - '10'
286
+ - '68'
287
+ - '348'
288
+ - '244'
289
+ - '102'
290
+ - '474'
291
+ - '192'
292
+ - '144'
293
+ - '112'
294
+ - '25'
295
+ - '449'
296
+ - '308'
297
+ - '405'
298
+ - '48'
299
+ - '212'
300
+ - '205'
301
+ - '124'
302
+ - '153'
303
+ - '9'
304
+ - '5'
305
+ - '258'
306
+ - '306'
307
+ - '80'
308
+ - '394'
309
+ - '328'
310
+ - '208'
311
+ - '166'
312
+ - '36'
313
+ - '352'
314
+ - '18'
315
+ - '397'
316
+ - '66'
317
+ - '31'
318
+ - '16'
319
+ - '426'
320
+ - '332'
321
+ - '23'
322
+ - '281'
323
+ - '215'
324
+ - '88'
325
+ - '171'
326
+ - '221'
327
+ - '184'
328
+ - '202'
329
+ - '470'
330
+ - '247'
331
+ - '38'
332
+ - '389'
333
+ - '315'
334
+ - '197'
335
+ - '349'
336
+ - '304'
337
+ - '393'
338
+ - '380'
339
+ - '132'
340
+ - '456'
341
+ - '367'
342
+ - '479'
343
+ - '360'
344
+ - '123'
345
+ - '162'
346
+ - '365'
347
+ - '337'
348
+ - '467'
349
+ - '234'
350
+ - '364'
351
+ - '376'
352
+ - '173'
353
+ - '478'
354
+ - '425'
355
+ - '218'
356
+ - '297'
357
+ - '469'
358
+ - '282'
359
+ - '298'
360
+ - '451'
361
+ - '20'
362
+ - '117'
363
+ - '52'
364
+ - '113'
365
+ - '165'
366
+ - '280'
367
+ - '292'
368
+ - '226'
369
+ - '104'
370
+ - '55'
371
+ - '145'
372
+ - '286'
373
+ - '86'
374
+ - '294'
375
+ - '15'
376
+ - '216'
377
+ - '279'
378
+ - '275'
379
+ - '253'
380
+ - '312'
381
+ - '378'
382
+ - '287'
383
+ - '76'
384
+ - '168'
385
+ - '116'
386
+ - '368'
387
+ - '396'
388
+ - '336'
389
+ - '290'
390
+ - '53'
391
+ - '103'
392
+ - '0'
393
+ - '411'
394
+ - '228'
395
+ - '408'
396
+ - '285'
397
+ - '151'
398
+ - '325'
399
+ - '193'
400
+ - '428'
401
+ - '401'
402
+ - '320'
403
+ - '182'
404
+ - '480'
405
+ - '264'
406
+ - '383'
407
+ - '114'
408
+ - '115'
409
+ - '374'
410
+ - '141'
411
+ - '22'
412
+ - '466'
413
+ - '384'
414
+ - '174'
415
+ - '59'
416
+ - '326'
417
+ - '105'
418
+ - '232'
419
+ - '464'
420
+ - '251'
421
+ - '24'
422
+ - '172'
423
+ - '150'
424
+ - '299'
425
+ - '89'
426
+ - '344'
427
+ - '427'
428
+ - '333'
429
+ - '434'
430
+ - '107'
431
+ - '291'
432
+ - '194'
433
+ - '497'
434
+ - '452'
435
+ - '317'
436
+ - '254'
437
+ - '213'
438
+ - '499'
439
+ - '483'
440
+ - '432'
441
+ - '95'
442
+ - '321'
443
+ - '111'
444
+ - '8'
445
+ - '175'
446
+ - '277'
447
+ - '65'
448
+ - '342'
449
+ - '382'
450
+ - '301'
451
+ - '45'
452
+ - '443'
453
+ - '63'
454
+ - '93'
455
+ - '489'
456
+ - '74'
457
+ - '387'
458
+ - '370'
459
+ - '340'
460
+ - '358'
461
+ - '220'
462
+ - '429'
463
+ - '2'
464
+ - '331'
465
+ - '181'
466
+ - '32'
467
+ - '324'
468
+ - '191'
469
+ - '238'
470
+ - '313'
471
+ - '157'
472
+ - '91'
473
+ - '101'
474
+ - '118'
475
+ - '350'
476
+ - '356'
477
+ - '486'
478
+ - '188'
479
+ - '142'
480
+ - '419'
481
+ - '195'
482
+ - '164'
483
+ - '487'
484
+ - '255'
485
+ - '323'
486
+ - '222'
487
+ - '35'
488
+ - '245'
489
+ - '359'
490
+ - '249'
491
+ - '98'
492
+ - '271'
493
+ - '231'
494
+ - '125'
495
+ - '29'
496
+ - '34'
497
+ - '119'
498
+ - '134'
499
+ - '284'
500
+ - '309'
501
+ - '409'
502
+ - '422'
503
+ - '147'
504
+ - '484'
505
+ - '462'
506
+ - '390'
507
+ - '440'
508
+ - '283'
509
+ - '84'
510
+ - '108'
511
+ - '139'
512
+ - '170'
513
+ - '303'
514
+ - '371'
515
+ - '381'
516
+ - '278'
517
+ - '329'
518
+ - '28'
519
+ - '87'
520
+ - '403'
521
+ - '256'
522
+ - '441'
523
+ - '334'
524
+ - '12'
525
+ - '260'
526
+ - '265'
527
+ - '69'
528
+ - '122'
529
+ - '488'
530
+ - '99'
531
+ - '42'
532
+ - '302'
533
+ - '97'
534
+ - '70'
535
+ - '152'
536
+ - '177'
537
+ - '138'
538
+ - '296'
539
+ - '51'
540
+ - '491'
541
+ - '199'
542
+ - '176'
543
+ - '204'
544
+ - '169'
545
+ - '386'
546
+ - '494'
547
+ - '400'
548
+ - '341'
549
+ - '229'
550
+ - '273'
551
+ - '485'
552
+ - '135'
553
+ - '227'
554
+ - '54'
555
+ - '314'
556
+ - '343'
557
+ - '477'
558
+ - '465'
559
+ - '482'
560
+ - '257'
561
+ - '435'
562
+ - '423'
563
+ - '121'
564
+ - '496'
565
+ - '448'
566
+ - '453'
567
+ - '85'
568
+ - '57'
569
+ - '276'
570
+ - '210'
571
+ - '272'
572
+ - '236'
573
+ - '407'
574
+ - '445'
575
+ - '90'
576
+ - '266'
577
+ - '490'
578
+ - '307'
579
+ - '155'
580
+ - '136'
581
+ - '19'
582
+ - '319'
583
+ - '498'
584
+ - '163'
585
+ - '75'
586
+ - '442'
587
+ - '495'
588
+ - '421'
589
+ - '209'
590
+ - '361'
591
+ - '156'
592
+ - '395'
593
+ - '472'
594
+ - '415'
595
+ - '347'
596
+ - '252'
597
+ - '468'
598
+ - '476'
599
+ - '106'
600
+ - '143'
601
+ - '263'
602
+ - '373'
603
+ - '327'
604
+ - '322'
605
+ - '399'
606
+ - '404'
607
+ - '13'
608
+ - '288'
609
+ - '207'
610
+ - '58'
611
+ - '481'
612
+ - '131'
613
+ - '385'
614
+ - '447'
615
+ - '219'
616
+ - '438'
617
+ - '461'
618
+ - '416'
619
+ - '246'
620
+ - '417'
621
+ - '26'
622
+ - '158'
623
+ - '431'
624
+ - '270'
625
+ - '128'
626
+ - '413'
627
+ - '310'
628
+ - '140'
629
+ - '17'
630
+ - '392'
631
+ - '44'
632
+ - '27'
633
+ - '214'
634
+ - '377'
635
+ - '305'
636
+ - '72'
637
+ - '420'
638
+ - '133'
639
+ - '363'
640
+ - '379'
641
+ - '94'
642
+ - '225'
643
+ - '335'
644
+ - '493'
645
+ - '492'
646
+ - '372'
647
+ - '196'
648
+ - '248'
649
+ - '178'
650
+ - '1'
651
+ - <unk>
652
+ - <sos/eos>
653
+ init: null
654
+ collate_fn_conf:
655
+ label_downsampling: 1
656
+ pad: false
657
+ rand_crop: true
658
+ input_size: 1
659
+ num_classes: 500
660
+ use_preprocessor: true
661
+ token_type: word
662
+ bpemodel: null
663
+ non_linguistic_symbols: null
664
+ cleaner: null
665
+ g2p: null
666
+ speech_volume_normalize: null
667
+ rir_scp: null
668
+ rir_apply_prob: 1.0
669
+ noise_scp: null
670
+ noise_apply_prob: 1.0
671
+ noise_db_range: '13_15'
672
+ pred_masked_weight: 1.0
673
+ pred_nomask_weight: 0.0
674
+ loss_weights: 0.0
675
+ frontend: null
676
+ frontend_conf: {}
677
+ specaug: null
678
+ specaug_conf: {}
679
+ normalize: null
680
+ normalize_conf: {}
681
+ preencoder: null
682
+ preencoder_conf: {}
683
+ encoder: torchaudio_hubert
684
+ encoder_conf:
685
+ encoder_projection_dropout: 0.0
686
+ encoder_attention_dropout: 0.0
687
+ encoder_ff_interm_dropout: 0.0
688
+ encoder_dropout: 0.0
689
+ encoder_layer_drop: 0.0
690
+ extractor_mode: layer_norm
691
+ encoder_embed_dim: 1024
692
+ encoder_num_layers: 24
693
+ encoder_num_heads: 16
694
+ encoder_ff_interm_features: 4096
695
+ encoder_layer_norm_first: true
696
+ normalize_feats: true
697
+ final_dim: 768
698
+ model: torchaudio
699
+ model_conf: {}
700
+ required:
701
+ - output_dir
702
+ - token_list
703
+ version: '202301'
704
+ distributed: true
705
+ ```
706
+
707
+ </details>
708
+
709
+
710
+
711
+ ### Citing ESPnet
712
+
713
+ ```bibtex
714
+ @inproceedings{watanabe2018espnet,
715
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
716
+ title={{ESPnet}: End-to-End Speech Processing Toolkit},
717
+ year={2018},
718
+ booktitle={Proceedings of Interspeech},
719
+ pages={2207--2211},
720
+ doi={10.21437/Interspeech.2018-1456},
721
+ url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
722
+ }
723
+
724
+
725
+
726
+
727
+ ```
728
+
729
+ or arXiv:
730
+
731
+ ```bibtex
732
+ @misc{watanabe2018espnet,
733
+ title={ESPnet: End-to-End Speech Processing Toolkit},
734
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
735
+ year={2018},
736
+ eprint={1804.00015},
737
+ archivePrefix={arXiv},
738
+ primaryClass={cs.CL}
739
+ }
740
+ ```
meta.yaml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ espnet: '202301'
2
+ files:
3
+ model_file: /mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/valid.loss.ave_10best.pth
4
+ python: "3.8.16 (default, Jan 17 2023, 23:13:24) \n[GCC 11.2.0]"
5
+ timestamp: 1680639936.937445
6
+ torch: 1.13.1
7
+ yaml_files:
8
+ train_config: /mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/config.yaml
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/config.yaml ADDED
@@ -0,0 +1,667 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 16
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: 8
14
+ dist_rank: 0
15
+ local_rank: 0
16
+ dist_master_addr: localhost
17
+ dist_master_port: 55415
18
+ dist_launcher: null
19
+ multiprocessing_distributed: true
20
+ unused_parameters: true
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 190
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - loss
39
+ - min
40
+ keep_nbest_models: 10
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 5.0
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 16
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: true
50
+ log_interval: null
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ create_graph_in_tensorboard: false
54
+ use_wandb: false
55
+ wandb_project: null
56
+ wandb_id: null
57
+ wandb_entity: null
58
+ wandb_name: null
59
+ wandb_model_log_interval: -1
60
+ detect_anomaly: false
61
+ pretrain_path: null
62
+ init_param: []
63
+ ignore_init_mismatch: false
64
+ freeze_param: []
65
+ num_iters_per_epoch: 40000
66
+ batch_size: 20
67
+ valid_batch_size: null
68
+ batch_bins: 100000
69
+ valid_batch_bins: null
70
+ train_shape_file:
71
+ - exp/hubert_iter1_stats_raw/splits16/speech_shape
72
+ - exp/hubert_iter1_stats_raw/splits16/text_shape.word
73
+ valid_shape_file:
74
+ - exp/hubert_iter1_stats_raw/valid/speech_shape
75
+ - exp/hubert_iter1_stats_raw/valid/text_shape.word
76
+ batch_type: numel
77
+ valid_batch_type: null
78
+ fold_length:
79
+ - 80000
80
+ - 400
81
+ sort_in_batch: descending
82
+ sort_batch: descending
83
+ multiple_iterator: true
84
+ chunk_length: 500
85
+ chunk_shift_ratio: 0.5
86
+ num_cache_chunks: 1024
87
+ train_data_path_and_name_and_type:
88
+ - - exp/hubert_iter1_stats_raw/splits16/wav.scp
89
+ - speech
90
+ - sound
91
+ - - exp/hubert_iter1_stats_raw/splits16/text.km.kmeans_iter1_hubert_train_60k_portion0.1_gigaspeech
92
+ - text
93
+ - text
94
+ valid_data_path_and_name_and_type:
95
+ - - dump/raw/dev/wav.scp
96
+ - speech
97
+ - sound
98
+ - - dump/raw/dev/text.km.kmeans_iter1_hubert_train_60k_portion0.1_gigaspeech
99
+ - text
100
+ - text
101
+ allow_variable_data_keys: false
102
+ max_cache_size: 0.0
103
+ max_cache_fd: 32
104
+ valid_max_cache_size: null
105
+ exclude_weight_decay: false
106
+ exclude_weight_decay_conf: {}
107
+ optim: adam
108
+ optim_conf:
109
+ lr: 0.0005
110
+ scheduler: warmuplr
111
+ scheduler_conf:
112
+ warmup_steps: 32000
113
+ token_list:
114
+ - '6'
115
+ - '185'
116
+ - '233'
117
+ - '206'
118
+ - '200'
119
+ - '47'
120
+ - '129'
121
+ - '362'
122
+ - '436'
123
+ - '50'
124
+ - '30'
125
+ - '137'
126
+ - '39'
127
+ - '126'
128
+ - '81'
129
+ - '78'
130
+ - '444'
131
+ - '439'
132
+ - '230'
133
+ - '33'
134
+ - '14'
135
+ - '61'
136
+ - '450'
137
+ - '239'
138
+ - '293'
139
+ - '161'
140
+ - '410'
141
+ - '355'
142
+ - '262'
143
+ - '475'
144
+ - '338'
145
+ - '201'
146
+ - '242'
147
+ - '318'
148
+ - '159'
149
+ - '56'
150
+ - '190'
151
+ - '21'
152
+ - '259'
153
+ - '458'
154
+ - '187'
155
+ - '268'
156
+ - '7'
157
+ - '398'
158
+ - '67'
159
+ - '11'
160
+ - '455'
161
+ - '241'
162
+ - '4'
163
+ - '261'
164
+ - '412'
165
+ - '388'
166
+ - '402'
167
+ - '414'
168
+ - '180'
169
+ - '41'
170
+ - '198'
171
+ - '100'
172
+ - '459'
173
+ - '96'
174
+ - '235'
175
+ - '267'
176
+ - '203'
177
+ - '189'
178
+ - '60'
179
+ - '160'
180
+ - '64'
181
+ - '300'
182
+ - '295'
183
+ - '473'
184
+ - '37'
185
+ - '130'
186
+ - '77'
187
+ - '424'
188
+ - '369'
189
+ - '217'
190
+ - '366'
191
+ - '3'
192
+ - '82'
193
+ - '149'
194
+ - '330'
195
+ - '79'
196
+ - '351'
197
+ - '223'
198
+ - '446'
199
+ - '269'
200
+ - '148'
201
+ - '186'
202
+ - '110'
203
+ - '62'
204
+ - '471'
205
+ - '316'
206
+ - '433'
207
+ - '127'
208
+ - '354'
209
+ - '243'
210
+ - '457'
211
+ - '240'
212
+ - '375'
213
+ - '46'
214
+ - '40'
215
+ - '339'
216
+ - '224'
217
+ - '183'
218
+ - '179'
219
+ - '357'
220
+ - '430'
221
+ - '83'
222
+ - '49'
223
+ - '154'
224
+ - '237'
225
+ - '460'
226
+ - '353'
227
+ - '289'
228
+ - '92'
229
+ - '109'
230
+ - '311'
231
+ - '71'
232
+ - '391'
233
+ - '406'
234
+ - '43'
235
+ - '73'
236
+ - '418'
237
+ - '437'
238
+ - '250'
239
+ - '463'
240
+ - '120'
241
+ - '346'
242
+ - '146'
243
+ - '454'
244
+ - '211'
245
+ - '274'
246
+ - '167'
247
+ - '345'
248
+ - '10'
249
+ - '68'
250
+ - '348'
251
+ - '244'
252
+ - '102'
253
+ - '474'
254
+ - '192'
255
+ - '144'
256
+ - '112'
257
+ - '25'
258
+ - '449'
259
+ - '308'
260
+ - '405'
261
+ - '48'
262
+ - '212'
263
+ - '205'
264
+ - '124'
265
+ - '153'
266
+ - '9'
267
+ - '5'
268
+ - '258'
269
+ - '306'
270
+ - '80'
271
+ - '394'
272
+ - '328'
273
+ - '208'
274
+ - '166'
275
+ - '36'
276
+ - '352'
277
+ - '18'
278
+ - '397'
279
+ - '66'
280
+ - '31'
281
+ - '16'
282
+ - '426'
283
+ - '332'
284
+ - '23'
285
+ - '281'
286
+ - '215'
287
+ - '88'
288
+ - '171'
289
+ - '221'
290
+ - '184'
291
+ - '202'
292
+ - '470'
293
+ - '247'
294
+ - '38'
295
+ - '389'
296
+ - '315'
297
+ - '197'
298
+ - '349'
299
+ - '304'
300
+ - '393'
301
+ - '380'
302
+ - '132'
303
+ - '456'
304
+ - '367'
305
+ - '479'
306
+ - '360'
307
+ - '123'
308
+ - '162'
309
+ - '365'
310
+ - '337'
311
+ - '467'
312
+ - '234'
313
+ - '364'
314
+ - '376'
315
+ - '173'
316
+ - '478'
317
+ - '425'
318
+ - '218'
319
+ - '297'
320
+ - '469'
321
+ - '282'
322
+ - '298'
323
+ - '451'
324
+ - '20'
325
+ - '117'
326
+ - '52'
327
+ - '113'
328
+ - '165'
329
+ - '280'
330
+ - '292'
331
+ - '226'
332
+ - '104'
333
+ - '55'
334
+ - '145'
335
+ - '286'
336
+ - '86'
337
+ - '294'
338
+ - '15'
339
+ - '216'
340
+ - '279'
341
+ - '275'
342
+ - '253'
343
+ - '312'
344
+ - '378'
345
+ - '287'
346
+ - '76'
347
+ - '168'
348
+ - '116'
349
+ - '368'
350
+ - '396'
351
+ - '336'
352
+ - '290'
353
+ - '53'
354
+ - '103'
355
+ - '0'
356
+ - '411'
357
+ - '228'
358
+ - '408'
359
+ - '285'
360
+ - '151'
361
+ - '325'
362
+ - '193'
363
+ - '428'
364
+ - '401'
365
+ - '320'
366
+ - '182'
367
+ - '480'
368
+ - '264'
369
+ - '383'
370
+ - '114'
371
+ - '115'
372
+ - '374'
373
+ - '141'
374
+ - '22'
375
+ - '466'
376
+ - '384'
377
+ - '174'
378
+ - '59'
379
+ - '326'
380
+ - '105'
381
+ - '232'
382
+ - '464'
383
+ - '251'
384
+ - '24'
385
+ - '172'
386
+ - '150'
387
+ - '299'
388
+ - '89'
389
+ - '344'
390
+ - '427'
391
+ - '333'
392
+ - '434'
393
+ - '107'
394
+ - '291'
395
+ - '194'
396
+ - '497'
397
+ - '452'
398
+ - '317'
399
+ - '254'
400
+ - '213'
401
+ - '499'
402
+ - '483'
403
+ - '432'
404
+ - '95'
405
+ - '321'
406
+ - '111'
407
+ - '8'
408
+ - '175'
409
+ - '277'
410
+ - '65'
411
+ - '342'
412
+ - '382'
413
+ - '301'
414
+ - '45'
415
+ - '443'
416
+ - '63'
417
+ - '93'
418
+ - '489'
419
+ - '74'
420
+ - '387'
421
+ - '370'
422
+ - '340'
423
+ - '358'
424
+ - '220'
425
+ - '429'
426
+ - '2'
427
+ - '331'
428
+ - '181'
429
+ - '32'
430
+ - '324'
431
+ - '191'
432
+ - '238'
433
+ - '313'
434
+ - '157'
435
+ - '91'
436
+ - '101'
437
+ - '118'
438
+ - '350'
439
+ - '356'
440
+ - '486'
441
+ - '188'
442
+ - '142'
443
+ - '419'
444
+ - '195'
445
+ - '164'
446
+ - '487'
447
+ - '255'
448
+ - '323'
449
+ - '222'
450
+ - '35'
451
+ - '245'
452
+ - '359'
453
+ - '249'
454
+ - '98'
455
+ - '271'
456
+ - '231'
457
+ - '125'
458
+ - '29'
459
+ - '34'
460
+ - '119'
461
+ - '134'
462
+ - '284'
463
+ - '309'
464
+ - '409'
465
+ - '422'
466
+ - '147'
467
+ - '484'
468
+ - '462'
469
+ - '390'
470
+ - '440'
471
+ - '283'
472
+ - '84'
473
+ - '108'
474
+ - '139'
475
+ - '170'
476
+ - '303'
477
+ - '371'
478
+ - '381'
479
+ - '278'
480
+ - '329'
481
+ - '28'
482
+ - '87'
483
+ - '403'
484
+ - '256'
485
+ - '441'
486
+ - '334'
487
+ - '12'
488
+ - '260'
489
+ - '265'
490
+ - '69'
491
+ - '122'
492
+ - '488'
493
+ - '99'
494
+ - '42'
495
+ - '302'
496
+ - '97'
497
+ - '70'
498
+ - '152'
499
+ - '177'
500
+ - '138'
501
+ - '296'
502
+ - '51'
503
+ - '491'
504
+ - '199'
505
+ - '176'
506
+ - '204'
507
+ - '169'
508
+ - '386'
509
+ - '494'
510
+ - '400'
511
+ - '341'
512
+ - '229'
513
+ - '273'
514
+ - '485'
515
+ - '135'
516
+ - '227'
517
+ - '54'
518
+ - '314'
519
+ - '343'
520
+ - '477'
521
+ - '465'
522
+ - '482'
523
+ - '257'
524
+ - '435'
525
+ - '423'
526
+ - '121'
527
+ - '496'
528
+ - '448'
529
+ - '453'
530
+ - '85'
531
+ - '57'
532
+ - '276'
533
+ - '210'
534
+ - '272'
535
+ - '236'
536
+ - '407'
537
+ - '445'
538
+ - '90'
539
+ - '266'
540
+ - '490'
541
+ - '307'
542
+ - '155'
543
+ - '136'
544
+ - '19'
545
+ - '319'
546
+ - '498'
547
+ - '163'
548
+ - '75'
549
+ - '442'
550
+ - '495'
551
+ - '421'
552
+ - '209'
553
+ - '361'
554
+ - '156'
555
+ - '395'
556
+ - '472'
557
+ - '415'
558
+ - '347'
559
+ - '252'
560
+ - '468'
561
+ - '476'
562
+ - '106'
563
+ - '143'
564
+ - '263'
565
+ - '373'
566
+ - '327'
567
+ - '322'
568
+ - '399'
569
+ - '404'
570
+ - '13'
571
+ - '288'
572
+ - '207'
573
+ - '58'
574
+ - '481'
575
+ - '131'
576
+ - '385'
577
+ - '447'
578
+ - '219'
579
+ - '438'
580
+ - '461'
581
+ - '416'
582
+ - '246'
583
+ - '417'
584
+ - '26'
585
+ - '158'
586
+ - '431'
587
+ - '270'
588
+ - '128'
589
+ - '413'
590
+ - '310'
591
+ - '140'
592
+ - '17'
593
+ - '392'
594
+ - '44'
595
+ - '27'
596
+ - '214'
597
+ - '377'
598
+ - '305'
599
+ - '72'
600
+ - '420'
601
+ - '133'
602
+ - '363'
603
+ - '379'
604
+ - '94'
605
+ - '225'
606
+ - '335'
607
+ - '493'
608
+ - '492'
609
+ - '372'
610
+ - '196'
611
+ - '248'
612
+ - '178'
613
+ - '1'
614
+ - <unk>
615
+ - <sos/eos>
616
+ init: null
617
+ collate_fn_conf:
618
+ label_downsampling: 1
619
+ pad: false
620
+ rand_crop: true
621
+ input_size: 1
622
+ num_classes: 500
623
+ use_preprocessor: true
624
+ token_type: word
625
+ bpemodel: null
626
+ non_linguistic_symbols: null
627
+ cleaner: null
628
+ g2p: null
629
+ speech_volume_normalize: null
630
+ rir_scp: null
631
+ rir_apply_prob: 1.0
632
+ noise_scp: null
633
+ noise_apply_prob: 1.0
634
+ noise_db_range: '13_15'
635
+ pred_masked_weight: 1.0
636
+ pred_nomask_weight: 0.0
637
+ loss_weights: 0.0
638
+ frontend: null
639
+ frontend_conf: {}
640
+ specaug: null
641
+ specaug_conf: {}
642
+ normalize: null
643
+ normalize_conf: {}
644
+ preencoder: null
645
+ preencoder_conf: {}
646
+ encoder: torchaudio_hubert
647
+ encoder_conf:
648
+ encoder_projection_dropout: 0.0
649
+ encoder_attention_dropout: 0.0
650
+ encoder_ff_interm_dropout: 0.0
651
+ encoder_dropout: 0.0
652
+ encoder_layer_drop: 0.0
653
+ extractor_mode: layer_norm
654
+ encoder_embed_dim: 1024
655
+ encoder_num_layers: 24
656
+ encoder_num_heads: 16
657
+ encoder_ff_interm_features: 4096
658
+ encoder_layer_norm_first: true
659
+ normalize_feats: true
660
+ final_dim: 768
661
+ model: torchaudio
662
+ model_conf: {}
663
+ required:
664
+ - output_dir
665
+ - token_list
666
+ version: '202301'
667
+ distributed: true
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/acc_m.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/acc_u.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/backward_time.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/correct_m.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/correct_u.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/count_m.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/count_u.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/forward_time.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/gpu_max_cached_mem_GB.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/iter_time.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/loss.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/optim0_lr0.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/optim_step_time.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/images/train_time.png ADDED
mnt/datastore/exp/hubert_iter1_train_ssl_torchaudiohubert_large_960h_pretrain_it2_bins_raw/valid.loss.ave_10best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baed99a6ea2a0558fca545e2001eca82b8f894f7c044783b35a8409e00ded604
3
+ size 1266628481
mnt/datastore/exp/kmeans_iter1_hubert_train_960_portion0.1_gigaspeech/km_500.mdl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a20709ca2cbaa7e30232b2a51bfabfb5e887387311c8bd7eeb41d07c9d905917
3
+ size 1538858