ESPnet
audio
self-supervised-learning
speech-recognition
William Chen committed on
Commit
921b02e
1 Parent(s): d280e69
Files changed (19) hide show
  1. .gitattributes +1 -0
  2. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/config.yaml +672 -0
  3. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/acc_m.png +0 -0
  4. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/acc_u.png +0 -0
  5. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/backward_time.png +0 -0
  6. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/correct_m.png +0 -0
  7. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/correct_u.png +0 -0
  8. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/count_m.png +0 -0
  9. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/count_u.png +0 -0
  10. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/forward_time.png +0 -0
  11. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/gpu_max_cached_mem_GB.png +0 -0
  12. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/iter_time.png +0 -0
  13. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/loss.png +0 -0
  14. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/optim0_lr0.png +0 -0
  15. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/optim_step_time.png +0 -0
  16. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/train_time.png +0 -0
  17. exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/valid.acc_m.ave_10best.pth +3 -0
  18. exp_li/kmeans_iter2_hubert_train_li110_lid_portion0.1/km_500.mdl +3 -0
  19. meta.yaml +8 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ exp_li/kmeans_iter2_hubert_train_li110_lid_portion0.1/km_500.mdl filter=lfs diff=lfs merge=lfs -text
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/config.yaml ADDED
@@ -0,0 +1,672 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 4
10
+ num_att_plot: 0
11
+ dist_backend: nccl
12
+ dist_init_method: file:///scratch/bbjs/chen26/espnet_01_23/egs2/librispeech/ssl1/exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/.dist_init_a1240dd2-c062-43da-80c3-13d77add8604
13
+ dist_world_size: 32
14
+ dist_rank: 0
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: slurm
19
+ multiprocessing_distributed: true
20
+ unused_parameters: true
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 22
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - acc_m
39
+ - max
40
+ keep_nbest_models: 10
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 5.0
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 1
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: true
50
+ drop_last: true
51
+ debug_grad: false
52
+ log_interval: null
53
+ use_matplotlib: true
54
+ use_tensorboard: true
55
+ create_graph_in_tensorboard: false
56
+ use_wandb: false
57
+ wandb_project: null
58
+ wandb_id: null
59
+ wandb_entity: null
60
+ wandb_name: null
61
+ wandb_model_log_interval: -1
62
+ detect_anomaly: false
63
+ pretrain_path: null
64
+ init_param: []
65
+ ignore_init_mismatch: false
66
+ freeze_param: []
67
+ num_iters_per_epoch: 2000
68
+ batch_size: 20
69
+ valid_batch_size: null
70
+ batch_bins: 35000000
71
+ valid_batch_bins: null
72
+ train_shape_file:
73
+ - exp_li/hubert_iter2_stats_raw/splits16/speech_shape
74
+ - exp_li/hubert_iter2_stats_raw/splits16/text_shape.word
75
+ valid_shape_file:
76
+ - exp_li/hubert_iter2_stats_raw/valid/speech_shape
77
+ - exp_li/hubert_iter2_stats_raw/valid/text_shape.word
78
+ batch_type: numel
79
+ valid_batch_type: null
80
+ fold_length:
81
+ - 80000
82
+ - 400
83
+ sort_in_batch: descending
84
+ sort_batch: descending
85
+ multiple_iterator: true
86
+ chunk_length: 500
87
+ chunk_shift_ratio: 0.5
88
+ num_cache_chunks: 1024
89
+ train_data_path_and_name_and_type:
90
+ - - exp_li/hubert_iter2_stats_raw/splits16/wav.scp
91
+ - speech
92
+ - kaldi_ark
93
+ - - exp_li/hubert_iter2_stats_raw/splits16/text.km.kmeans_iter2_hubert_train_li110_lid_portion0.1
94
+ - text
95
+ - text
96
+ valid_data_path_and_name_and_type:
97
+ - - dump/raw/dev_all_li/wav.scp
98
+ - speech
99
+ - kaldi_ark
100
+ - - dump/raw/dev_all_li/text.km.kmeans_iter2_hubert_train_li110_lid_portion0.1
101
+ - text
102
+ - text
103
+ allow_variable_data_keys: false
104
+ max_cache_size: 0.0
105
+ max_cache_fd: 32
106
+ valid_max_cache_size: null
107
+ optim: adam
108
+ optim_conf:
109
+ lr: 0.0005
110
+ scheduler: warmuplr
111
+ scheduler_conf:
112
+ warmup_steps: 32000
113
+ token_list:
114
+ - '55'
115
+ - '477'
116
+ - '43'
117
+ - '405'
118
+ - '468'
119
+ - '486'
120
+ - '41'
121
+ - '34'
122
+ - '0'
123
+ - '415'
124
+ - '409'
125
+ - '367'
126
+ - '224'
127
+ - '436'
128
+ - '17'
129
+ - '462'
130
+ - '32'
131
+ - '481'
132
+ - '332'
133
+ - '291'
134
+ - '395'
135
+ - '336'
136
+ - '147'
137
+ - '364'
138
+ - '430'
139
+ - '454'
140
+ - '44'
141
+ - '196'
142
+ - '269'
143
+ - '230'
144
+ - '189'
145
+ - '274'
146
+ - '305'
147
+ - '419'
148
+ - '444'
149
+ - '352'
150
+ - '72'
151
+ - '158'
152
+ - '349'
153
+ - '212'
154
+ - '148'
155
+ - '13'
156
+ - '140'
157
+ - '164'
158
+ - '329'
159
+ - '288'
160
+ - '259'
161
+ - '9'
162
+ - '249'
163
+ - '30'
164
+ - '198'
165
+ - '299'
166
+ - '427'
167
+ - '301'
168
+ - '107'
169
+ - '344'
170
+ - '213'
171
+ - '36'
172
+ - '203'
173
+ - '120'
174
+ - '208'
175
+ - '285'
176
+ - '69'
177
+ - '181'
178
+ - '166'
179
+ - '130'
180
+ - '402'
181
+ - '194'
182
+ - '37'
183
+ - '106'
184
+ - '330'
185
+ - '407'
186
+ - '242'
187
+ - '412'
188
+ - '167'
189
+ - '133'
190
+ - '40'
191
+ - '211'
192
+ - '57'
193
+ - '389'
194
+ - '325'
195
+ - '197'
196
+ - '170'
197
+ - '190'
198
+ - '260'
199
+ - '286'
200
+ - '257'
201
+ - '374'
202
+ - '116'
203
+ - '38'
204
+ - '221'
205
+ - '81'
206
+ - '87'
207
+ - '4'
208
+ - '173'
209
+ - '94'
210
+ - '83'
211
+ - '200'
212
+ - '331'
213
+ - '143'
214
+ - '248'
215
+ - '22'
216
+ - '26'
217
+ - '388'
218
+ - '174'
219
+ - '488'
220
+ - '320'
221
+ - '397'
222
+ - '188'
223
+ - '401'
224
+ - '126'
225
+ - '28'
226
+ - '11'
227
+ - '304'
228
+ - '135'
229
+ - '33'
230
+ - '109'
231
+ - '202'
232
+ - '267'
233
+ - '86'
234
+ - '487'
235
+ - '490'
236
+ - '482'
237
+ - '426'
238
+ - '103'
239
+ - '151'
240
+ - '324'
241
+ - '492'
242
+ - '238'
243
+ - '483'
244
+ - '467'
245
+ - '1'
246
+ - '20'
247
+ - '268'
248
+ - '21'
249
+ - '47'
250
+ - '377'
251
+ - '351'
252
+ - '297'
253
+ - '398'
254
+ - '348'
255
+ - '157'
256
+ - '303'
257
+ - '100'
258
+ - '68'
259
+ - '254'
260
+ - '216'
261
+ - '177'
262
+ - '491'
263
+ - '171'
264
+ - '361'
265
+ - '24'
266
+ - '338'
267
+ - '129'
268
+ - '154'
269
+ - '192'
270
+ - '222'
271
+ - '8'
272
+ - '156'
273
+ - '7'
274
+ - '78'
275
+ - '64'
276
+ - '29'
277
+ - '146'
278
+ - '90'
279
+ - '263'
280
+ - '393'
281
+ - '95'
282
+ - '102'
283
+ - '433'
284
+ - '480'
285
+ - '225'
286
+ - '59'
287
+ - '66'
288
+ - '82'
289
+ - '85'
290
+ - '54'
291
+ - '310'
292
+ - '429'
293
+ - '176'
294
+ - '366'
295
+ - '42'
296
+ - '298'
297
+ - '144'
298
+ - '215'
299
+ - '318'
300
+ - '136'
301
+ - '122'
302
+ - '459'
303
+ - '205'
304
+ - '498'
305
+ - '112'
306
+ - '52'
307
+ - '396'
308
+ - '282'
309
+ - '428'
310
+ - '335'
311
+ - '339'
312
+ - '386'
313
+ - '289'
314
+ - '187'
315
+ - '333'
316
+ - '449'
317
+ - '458'
318
+ - '233'
319
+ - '35'
320
+ - '400'
321
+ - '223'
322
+ - '375'
323
+ - '70'
324
+ - '134'
325
+ - '127'
326
+ - '410'
327
+ - '71'
328
+ - '312'
329
+ - '73'
330
+ - '341'
331
+ - '326'
332
+ - '273'
333
+ - '472'
334
+ - '23'
335
+ - '113'
336
+ - '117'
337
+ - '387'
338
+ - '207'
339
+ - '342'
340
+ - '12'
341
+ - '49'
342
+ - '281'
343
+ - '65'
344
+ - '356'
345
+ - '99'
346
+ - '423'
347
+ - '141'
348
+ - '493'
349
+ - '61'
350
+ - '494'
351
+ - '277'
352
+ - '453'
353
+ - '362'
354
+ - '185'
355
+ - '460'
356
+ - '256'
357
+ - '159'
358
+ - '302'
359
+ - '88'
360
+ - '53'
361
+ - '76'
362
+ - '243'
363
+ - '235'
364
+ - '306'
365
+ - '278'
366
+ - '15'
367
+ - '56'
368
+ - '25'
369
+ - '115'
370
+ - '48'
371
+ - '264'
372
+ - '363'
373
+ - '110'
374
+ - '204'
375
+ - '414'
376
+ - '287'
377
+ - '184'
378
+ - '172'
379
+ - '383'
380
+ - '316'
381
+ - '424'
382
+ - '169'
383
+ - '358'
384
+ - '14'
385
+ - '206'
386
+ - '91'
387
+ - '245'
388
+ - '447'
389
+ - '60'
390
+ - '125'
391
+ - '283'
392
+ - '246'
393
+ - '255'
394
+ - '313'
395
+ - '97'
396
+ - '89'
397
+ - '321'
398
+ - '214'
399
+ - '314'
400
+ - '464'
401
+ - '27'
402
+ - '294'
403
+ - '497'
404
+ - '128'
405
+ - '451'
406
+ - '365'
407
+ - '478'
408
+ - '337'
409
+ - '226'
410
+ - '422'
411
+ - '471'
412
+ - '381'
413
+ - '63'
414
+ - '452'
415
+ - '290'
416
+ - '118'
417
+ - '51'
418
+ - '261'
419
+ - '432'
420
+ - '376'
421
+ - '31'
422
+ - '80'
423
+ - '142'
424
+ - '295'
425
+ - '275'
426
+ - '272'
427
+ - '123'
428
+ - '270'
429
+ - '236'
430
+ - '195'
431
+ - '469'
432
+ - '50'
433
+ - '218'
434
+ - '435'
435
+ - '479'
436
+ - '315'
437
+ - '182'
438
+ - '372'
439
+ - '446'
440
+ - '132'
441
+ - '327'
442
+ - '229'
443
+ - '217'
444
+ - '373'
445
+ - '340'
446
+ - '153'
447
+ - '2'
448
+ - '163'
449
+ - '199'
450
+ - '378'
451
+ - '101'
452
+ - '79'
453
+ - '96'
454
+ - '434'
455
+ - '489'
456
+ - '247'
457
+ - '440'
458
+ - '448'
459
+ - '139'
460
+ - '466'
461
+ - '150'
462
+ - '465'
463
+ - '62'
464
+ - '421'
465
+ - '252'
466
+ - '104'
467
+ - '180'
468
+ - '232'
469
+ - '108'
470
+ - '307'
471
+ - '219'
472
+ - '228'
473
+ - '322'
474
+ - '455'
475
+ - '370'
476
+ - '39'
477
+ - '280'
478
+ - '114'
479
+ - '240'
480
+ - '137'
481
+ - '179'
482
+ - '162'
483
+ - '406'
484
+ - '168'
485
+ - '368'
486
+ - '473'
487
+ - '75'
488
+ - '441'
489
+ - '266'
490
+ - '442'
491
+ - '119'
492
+ - '347'
493
+ - '92'
494
+ - '209'
495
+ - '470'
496
+ - '296'
497
+ - '476'
498
+ - '93'
499
+ - '191'
500
+ - '437'
501
+ - '293'
502
+ - '186'
503
+ - '111'
504
+ - '265'
505
+ - '183'
506
+ - '145'
507
+ - '394'
508
+ - '155'
509
+ - '420'
510
+ - '438'
511
+ - '5'
512
+ - '463'
513
+ - '431'
514
+ - '334'
515
+ - '138'
516
+ - '3'
517
+ - '369'
518
+ - '403'
519
+ - '84'
520
+ - '152'
521
+ - '392'
522
+ - '18'
523
+ - '231'
524
+ - '417'
525
+ - '160'
526
+ - '357'
527
+ - '323'
528
+ - '475'
529
+ - '131'
530
+ - '485'
531
+ - '350'
532
+ - '450'
533
+ - '439'
534
+ - '353'
535
+ - '443'
536
+ - '384'
537
+ - '16'
538
+ - '201'
539
+ - '346'
540
+ - '253'
541
+ - '404'
542
+ - '445'
543
+ - '250'
544
+ - '165'
545
+ - '98'
546
+ - '193'
547
+ - '300'
548
+ - '328'
549
+ - '234'
550
+ - '496'
551
+ - '67'
552
+ - '359'
553
+ - '46'
554
+ - '345'
555
+ - '317'
556
+ - '354'
557
+ - '385'
558
+ - '276'
559
+ - '309'
560
+ - '425'
561
+ - '311'
562
+ - '456'
563
+ - '220'
564
+ - '178'
565
+ - '124'
566
+ - '244'
567
+ - '416'
568
+ - '399'
569
+ - '161'
570
+ - '413'
571
+ - '308'
572
+ - '371'
573
+ - '258'
574
+ - '45'
575
+ - '360'
576
+ - '149'
577
+ - '284'
578
+ - '241'
579
+ - '319'
580
+ - '411'
581
+ - '461'
582
+ - '237'
583
+ - '408'
584
+ - '390'
585
+ - '227'
586
+ - '382'
587
+ - '10'
588
+ - '292'
589
+ - '355'
590
+ - '262'
591
+ - '418'
592
+ - '379'
593
+ - '6'
594
+ - '271'
595
+ - '380'
596
+ - '105'
597
+ - '251'
598
+ - '175'
599
+ - '239'
600
+ - '210'
601
+ - '74'
602
+ - '495'
603
+ - '279'
604
+ - '457'
605
+ - '343'
606
+ - '77'
607
+ - '19'
608
+ - '391'
609
+ - '121'
610
+ - '499'
611
+ - '474'
612
+ - '484'
613
+ - '58'
614
+ - <unk>
615
+ - <sos/eos>
616
+ init: null
617
+ collate_fn_conf:
618
+ label_downsampling: 1
619
+ pad: false
620
+ rand_crop: true
621
+ mix_speech: true
622
+ noise_apply_prob: 0.2
623
+ input_size: 1
624
+ num_classes: 500
625
+ use_preprocessor: true
626
+ use_mixing: true
627
+ cs_aug: false
628
+ mixing_splits: 16
629
+ token_type: word
630
+ bpemodel: null
631
+ non_linguistic_symbols: null
632
+ cleaner: null
633
+ g2p: null
634
+ speech_volume_normalize: null
635
+ rir_scp: null
636
+ rir_apply_prob: 1.0
637
+ noise_scp: data/noise/wav.scp
638
+ noise_apply_prob: 0.2
639
+ noise_db_range: '13_15'
640
+ pred_masked_weight: 1.0
641
+ pred_nomask_weight: 0.0
642
+ loss_weights: 0.0
643
+ frontend: null
644
+ frontend_conf: {}
645
+ specaug: null
646
+ specaug_conf: {}
647
+ normalize: null
648
+ normalize_conf: {}
649
+ preencoder: null
650
+ preencoder_conf: {}
651
+ encoder: torchaudio_hubert
652
+ encoder_conf:
653
+ encoder_projection_dropout: 0.0
654
+ encoder_attention_dropout: 0.0
655
+ encoder_ff_interm_dropout: 0.0
656
+ encoder_dropout: 0.0
657
+ encoder_layer_drop: 0.0
658
+ extractor_mode: layer_norm
659
+ encoder_embed_dim: 1024
660
+ encoder_num_layers: 24
661
+ encoder_num_heads: 16
662
+ encoder_ff_interm_features: 4096
663
+ encoder_layer_norm_first: true
664
+ final_dim: 768
665
+ feature_grad_mult: null
666
+ model: torchaudio
667
+ model_conf: {}
668
+ required:
669
+ - output_dir
670
+ - token_list
671
+ version: '202211'
672
+ distributed: true
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/acc_m.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/acc_u.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/backward_time.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/correct_m.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/correct_u.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/count_m.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/count_u.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/forward_time.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/gpu_max_cached_mem_GB.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/iter_time.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/loss.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/optim0_lr0.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/optim_step_time.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/images/train_time.png ADDED
exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/valid.acc_m.ave_10best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f76d44067300e75f862cdece5daf6062b4c75c6274292238e6495c811fa71124
3
+ size 1266628966
exp_li/kmeans_iter2_hubert_train_li110_lid_portion0.1/km_500.mdl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7497b3a32380a6e3c3e8f09ae2e007bd3bb8e9d10bc3ba8a225d3714a5b4cf8f
3
+ size 1538858
meta.yaml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ espnet: '202211'
2
+ files:
3
+ model_file: exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/valid.acc_m.ave_10best.pth
4
+ python: "3.8.16 (default, Jan 17 2023, 23:13:24) \n[GCC 11.2.0]"
5
+ timestamp: 1696274467.929186
6
+ torch: 2.0.1+cu117
7
+ yaml_files:
8
+ train_config: exp_li/hubert_iter2_train_ssl_torchaudiohubert_large_960h_pretrain_it2_wavlm_raw_layer_9/config.yaml