JinchuanTian committed on
Commit
09ecea1
·
verified ·
1 Parent(s): dcb376f

Upload folder using huggingface_hub

Browse files
exp/kmeans/38epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fd02581b4dd06736d1a6aa29e20c442afe3d9b299c88359f63320292a5c5cff
3
+ size 2306233340
exp/kmeans/config.yaml ADDED
@@ -0,0 +1,706 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_xeus.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: exp/ssl_train_xeus_raw
9
+ ngpu: 1
10
+ seed: 1
11
+ num_workers: 4
12
+ num_att_plot: 0
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: null
16
+ dist_rank: null
17
+ local_rank: 0
18
+ dist_master_addr: null
19
+ dist_master_port: null
20
+ dist_launcher: null
21
+ multiprocessing_distributed: false
22
+ unused_parameters: false
23
+ sharded_ddp: false
24
+ use_deepspeed: false
25
+ deepspeed_config: null
26
+ gradient_as_bucket_view: true
27
+ ddp_comm_hook: null
28
+ cudnn_enabled: true
29
+ cudnn_benchmark: false
30
+ cudnn_deterministic: true
31
+ use_tf32: false
32
+ collect_stats: false
33
+ write_collected_feats: false
34
+ max_epoch: 1
35
+ patience: null
36
+ val_scheduler_criterion:
37
+ - valid
38
+ - loss
39
+ early_stopping_criterion:
40
+ - valid
41
+ - loss
42
+ - min
43
+ best_model_criterion:
44
+ - - valid
45
+ - loss
46
+ - min
47
+ keep_nbest_models: 5
48
+ nbest_averaging_interval: 0
49
+ grad_clip: 10.0
50
+ grad_clip_type: 2.0
51
+ grad_noise: false
52
+ accum_grad: 1
53
+ no_forward_run: false
54
+ resume: true
55
+ train_dtype: float32
56
+ use_amp: true
57
+ log_interval: null
58
+ use_matplotlib: true
59
+ use_tensorboard: false
60
+ create_graph_in_tensorboard: false
61
+ use_wandb: false
62
+ wandb_project: null
63
+ wandb_id: null
64
+ wandb_entity: null
65
+ wandb_name: null
66
+ wandb_model_log_interval: -1
67
+ detect_anomaly: false
68
+ use_adapter: false
69
+ adapter: lora
70
+ save_strategy: all
71
+ adapter_conf: {}
72
+ pretrain_path: null
73
+ init_param: []
74
+ ignore_init_mismatch: false
75
+ freeze_param: []
76
+ num_iters_per_epoch: 10
77
+ batch_size: 20
78
+ valid_batch_size: null
79
+ batch_bins: 1600000
80
+ valid_batch_bins: null
81
+ category_sample_size: 10
82
+ train_shape_file:
83
+ - exp/ssl_stats_raw/train/speech_shape
84
+ valid_shape_file:
85
+ - exp/ssl_stats_raw/valid/speech_shape
86
+ batch_type: numel
87
+ valid_batch_type: null
88
+ fold_length:
89
+ - 80000
90
+ - 400
91
+ sort_in_batch: descending
92
+ shuffle_within_batch: false
93
+ sort_batch: descending
94
+ multiple_iterator: false
95
+ chunk_length: 500
96
+ chunk_shift_ratio: 0.5
97
+ num_cache_chunks: 1024
98
+ chunk_excluded_key_prefixes: []
99
+ chunk_default_fs: null
100
+ chunk_max_abs_length: null
101
+ chunk_discard_short_samples: true
102
+ train_data_path_and_name_and_type:
103
+ - - dump/raw/train_960/wav.scp
104
+ - speech
105
+ - sound
106
+ - - dump/raw/train_960/text
107
+ - text
108
+ - text
109
+ valid_data_path_and_name_and_type:
110
+ - - dump/raw/dev/wav.scp
111
+ - speech
112
+ - sound
113
+ - - dump/raw/dev/text
114
+ - text
115
+ - text
116
+ multi_task_dataset: false
117
+ allow_variable_data_keys: false
118
+ max_cache_size: 0.0
119
+ max_cache_fd: 32
120
+ allow_multi_rates: false
121
+ valid_max_cache_size: null
122
+ exclude_weight_decay: false
123
+ exclude_weight_decay_conf: {}
124
+ optim: adam
125
+ optim_conf:
126
+ lr: 0.0003
127
+ scheduler: warmuplr
128
+ scheduler_conf:
129
+ warmup_steps: 32000
130
+ token_list:
131
+ - '30'
132
+ - '4'
133
+ - '72'
134
+ - '305'
135
+ - '275'
136
+ - '24'
137
+ - '369'
138
+ - '125'
139
+ - '202'
140
+ - '368'
141
+ - '270'
142
+ - '296'
143
+ - '68'
144
+ - '188'
145
+ - '418'
146
+ - '223'
147
+ - '8'
148
+ - '338'
149
+ - '437'
150
+ - '14'
151
+ - '299'
152
+ - '469'
153
+ - '415'
154
+ - '11'
155
+ - '41'
156
+ - '227'
157
+ - '44'
158
+ - '35'
159
+ - '179'
160
+ - '449'
161
+ - '23'
162
+ - '10'
163
+ - '416'
164
+ - '291'
165
+ - '100'
166
+ - '74'
167
+ - '327'
168
+ - '107'
169
+ - '321'
170
+ - '208'
171
+ - '76'
172
+ - '267'
173
+ - '130'
174
+ - '173'
175
+ - '96'
176
+ - '162'
177
+ - '456'
178
+ - '84'
179
+ - '98'
180
+ - '217'
181
+ - '48'
182
+ - '482'
183
+ - '127'
184
+ - '110'
185
+ - '366'
186
+ - '336'
187
+ - '387'
188
+ - '105'
189
+ - '373'
190
+ - '139'
191
+ - '61'
192
+ - '370'
193
+ - '464'
194
+ - '397'
195
+ - '281'
196
+ - '151'
197
+ - '154'
198
+ - '155'
199
+ - '203'
200
+ - '440'
201
+ - '119'
202
+ - '71'
203
+ - '320'
204
+ - '93'
205
+ - '20'
206
+ - '138'
207
+ - '78'
208
+ - '216'
209
+ - '104'
210
+ - '205'
211
+ - '38'
212
+ - '382'
213
+ - '238'
214
+ - '474'
215
+ - '225'
216
+ - '465'
217
+ - '309'
218
+ - '17'
219
+ - '285'
220
+ - '90'
221
+ - '375'
222
+ - '356'
223
+ - '256'
224
+ - '392'
225
+ - '311'
226
+ - '398'
227
+ - '9'
228
+ - '264'
229
+ - '341'
230
+ - '168'
231
+ - '339'
232
+ - '40'
233
+ - '344'
234
+ - '422'
235
+ - '63'
236
+ - '396'
237
+ - '51'
238
+ - '184'
239
+ - '441'
240
+ - '346'
241
+ - '252'
242
+ - '206'
243
+ - '322'
244
+ - '444'
245
+ - '198'
246
+ - '66'
247
+ - '269'
248
+ - '145'
249
+ - '69'
250
+ - '244'
251
+ - '463'
252
+ - '37'
253
+ - '172'
254
+ - '271'
255
+ - '313'
256
+ - '279'
257
+ - '106'
258
+ - '377'
259
+ - '158'
260
+ - '5'
261
+ - '445'
262
+ - '455'
263
+ - '134'
264
+ - '287'
265
+ - '7'
266
+ - '297'
267
+ - '420'
268
+ - '13'
269
+ - '31'
270
+ - '484'
271
+ - '91'
272
+ - '34'
273
+ - '488'
274
+ - '468'
275
+ - '21'
276
+ - '193'
277
+ - '288'
278
+ - '159'
279
+ - '247'
280
+ - '476'
281
+ - '25'
282
+ - '265'
283
+ - '115'
284
+ - '50'
285
+ - '394'
286
+ - '197'
287
+ - '116'
288
+ - '57'
289
+ - '182'
290
+ - '378'
291
+ - '135'
292
+ - '89'
293
+ - '167'
294
+ - '19'
295
+ - '148'
296
+ - '425'
297
+ - '103'
298
+ - '95'
299
+ - '454'
300
+ - '376'
301
+ - '178'
302
+ - '79'
303
+ - '424'
304
+ - '261'
305
+ - '36'
306
+ - '426'
307
+ - '152'
308
+ - '102'
309
+ - '292'
310
+ - '258'
311
+ - '60'
312
+ - '328'
313
+ - '280'
314
+ - '273'
315
+ - '111'
316
+ - '240'
317
+ - '213'
318
+ - '483'
319
+ - '300'
320
+ - '363'
321
+ - '174'
322
+ - '317'
323
+ - '419'
324
+ - '439'
325
+ - '42'
326
+ - '118'
327
+ - '222'
328
+ - '15'
329
+ - '276'
330
+ - '277'
331
+ - '166'
332
+ - '304'
333
+ - '114'
334
+ - '329'
335
+ - '395'
336
+ - '413'
337
+ - '435'
338
+ - '33'
339
+ - '266'
340
+ - '133'
341
+ - '210'
342
+ - '408'
343
+ - '330'
344
+ - '315'
345
+ - '251'
346
+ - '6'
347
+ - '357'
348
+ - '171'
349
+ - '56'
350
+ - '1'
351
+ - '59'
352
+ - '359'
353
+ - '28'
354
+ - '215'
355
+ - '97'
356
+ - '274'
357
+ - '170'
358
+ - '49'
359
+ - '81'
360
+ - '108'
361
+ - '282'
362
+ - '85'
363
+ - '200'
364
+ - '80'
365
+ - '243'
366
+ - '364'
367
+ - '113'
368
+ - '176'
369
+ - '433'
370
+ - '77'
371
+ - '335'
372
+ - '231'
373
+ - '462'
374
+ - '62'
375
+ - '286'
376
+ - '67'
377
+ - '191'
378
+ - '228'
379
+ - '16'
380
+ - '22'
381
+ - '122'
382
+ - '235'
383
+ - '331'
384
+ - '137'
385
+ - '289'
386
+ - '92'
387
+ - '157'
388
+ - '417'
389
+ - '319'
390
+ - '2'
391
+ - '101'
392
+ - '129'
393
+ - '169'
394
+ - '26'
395
+ - '165'
396
+ - '143'
397
+ - '229'
398
+ - '220'
399
+ - '324'
400
+ - '393'
401
+ - '272'
402
+ - '43'
403
+ - '367'
404
+ - '204'
405
+ - '410'
406
+ - '278'
407
+ - '73'
408
+ - '65'
409
+ - '428'
410
+ - '411'
411
+ - '380'
412
+ - '99'
413
+ - '83'
414
+ - '412'
415
+ - '307'
416
+ - '306'
417
+ - '201'
418
+ - '361'
419
+ - '232'
420
+ - '290'
421
+ - '109'
422
+ - '140'
423
+ - '438'
424
+ - '64'
425
+ - '447'
426
+ - '374'
427
+ - '301'
428
+ - '249'
429
+ - '186'
430
+ - '234'
431
+ - '121'
432
+ - '239'
433
+ - '255'
434
+ - '82'
435
+ - '384'
436
+ - '160'
437
+ - '494'
438
+ - '351'
439
+ - '283'
440
+ - '32'
441
+ - '54'
442
+ - '52'
443
+ - '187'
444
+ - '337'
445
+ - '112'
446
+ - '260'
447
+ - '132'
448
+ - '47'
449
+ - '457'
450
+ - '211'
451
+ - '490'
452
+ - '430'
453
+ - '423'
454
+ - '175'
455
+ - '142'
456
+ - '499'
457
+ - '407'
458
+ - '303'
459
+ - '12'
460
+ - '403'
461
+ - '209'
462
+ - '233'
463
+ - '262'
464
+ - '146'
465
+ - '436'
466
+ - '219'
467
+ - '316'
468
+ - '123'
469
+ - '460'
470
+ - '39'
471
+ - '58'
472
+ - '333'
473
+ - '475'
474
+ - '70'
475
+ - '218'
476
+ - '199'
477
+ - '295'
478
+ - '389'
479
+ - '345'
480
+ - '156'
481
+ - '383'
482
+ - '390'
483
+ - '192'
484
+ - '343'
485
+ - '150'
486
+ - '318'
487
+ - '196'
488
+ - '94'
489
+ - '194'
490
+ - '27'
491
+ - '459'
492
+ - '257'
493
+ - '371'
494
+ - '498'
495
+ - '485'
496
+ - '190'
497
+ - '402'
498
+ - '163'
499
+ - '491'
500
+ - '0'
501
+ - '241'
502
+ - '467'
503
+ - '149'
504
+ - '18'
505
+ - '429'
506
+ - '421'
507
+ - '189'
508
+ - '365'
509
+ - '3'
510
+ - '75'
511
+ - '141'
512
+ - '259'
513
+ - '120'
514
+ - '372'
515
+ - '405'
516
+ - '354'
517
+ - '446'
518
+ - '340'
519
+ - '406'
520
+ - '353'
521
+ - '53'
522
+ - '334'
523
+ - '427'
524
+ - '432'
525
+ - '442'
526
+ - '131'
527
+ - '88'
528
+ - '470'
529
+ - '473'
530
+ - '254'
531
+ - '349'
532
+ - '214'
533
+ - '153'
534
+ - '342'
535
+ - '212'
536
+ - '434'
537
+ - '46'
538
+ - '86'
539
+ - '350'
540
+ - '284'
541
+ - '308'
542
+ - '323'
543
+ - '381'
544
+ - '161'
545
+ - '391'
546
+ - '248'
547
+ - '180'
548
+ - '230'
549
+ - '452'
550
+ - '325'
551
+ - '246'
552
+ - '224'
553
+ - '347'
554
+ - '195'
555
+ - '128'
556
+ - '55'
557
+ - '314'
558
+ - '126'
559
+ - '147'
560
+ - '481'
561
+ - '185'
562
+ - '358'
563
+ - '478'
564
+ - '400'
565
+ - '495'
566
+ - '388'
567
+ - '177'
568
+ - '181'
569
+ - '466'
570
+ - '362'
571
+ - '268'
572
+ - '326'
573
+ - '144'
574
+ - '493'
575
+ - '489'
576
+ - '450'
577
+ - '399'
578
+ - '443'
579
+ - '253'
580
+ - '236'
581
+ - '117'
582
+ - '448'
583
+ - '312'
584
+ - '379'
585
+ - '492'
586
+ - '496'
587
+ - '87'
588
+ - '332'
589
+ - '298'
590
+ - '497'
591
+ - '221'
592
+ - '480'
593
+ - '226'
594
+ - '302'
595
+ - '348'
596
+ - '136'
597
+ - '451'
598
+ - '479'
599
+ - '183'
600
+ - '45'
601
+ - '404'
602
+ - '263'
603
+ - '477'
604
+ - '355'
605
+ - '29'
606
+ - '414'
607
+ - '237'
608
+ - '409'
609
+ - '385'
610
+ - '461'
611
+ - '386'
612
+ - '124'
613
+ - '401'
614
+ - '352'
615
+ - '293'
616
+ - '471'
617
+ - '458'
618
+ - '472'
619
+ - '486'
620
+ - '164'
621
+ - '453'
622
+ - '310'
623
+ - '207'
624
+ - '487'
625
+ - '294'
626
+ - '360'
627
+ - '245'
628
+ - '242'
629
+ - '431'
630
+ - '250'
631
+ - <unk>
632
+ - <sos/eos>
633
+ init: xavier_uniform
634
+ collate_fn_conf:
635
+ label_downsampling: 1
636
+ pad: false
637
+ rand_crop: true
638
+ crop_audio: true
639
+ input_size: null
640
+ num_classes: null
641
+ use_preprocessor: true
642
+ token_type: word
643
+ bpemodel: null
644
+ non_linguistic_symbols: null
645
+ cleaner: null
646
+ g2p: null
647
+ speech_volume_normalize: null
648
+ rir_scp: null
649
+ rir_apply_prob: 1.0
650
+ noise_scp: null
651
+ noise_apply_prob: 1.0
652
+ noise_db_range: '13_15'
653
+ window_size: null
654
+ window_shift: null
655
+ loss:
656
+ - name: hubert
657
+ conf:
658
+ num_classes: 2048
659
+ final_dim: 768
660
+ util:
661
+ - name: mask
662
+ conf: {}
663
+ frontend: wav2vec_cnn
664
+ frontend_conf:
665
+ norm_mode: layer_norm
666
+ conv_mode: standard
667
+ bias: true
668
+ normalize_audio: true
669
+ normalize_output: false
670
+ fs: 16k
671
+ specaug: null
672
+ specaug_conf: {}
673
+ normalize: null
674
+ normalize_conf: {}
675
+ preencoder: linear
676
+ preencoder_conf:
677
+ output_size: 1024
678
+ encoder: e_branchformer
679
+ encoder_conf:
680
+ output_size: 1024
681
+ attention_heads: 8
682
+ attention_layer_type: selfattn
683
+ pos_enc_layer_type: conv
684
+ rel_pos_type: latest
685
+ cgmlp_linear_units: 4096
686
+ cgmlp_conv_kernel: 31
687
+ use_linear_after_conv: false
688
+ gate_activation: identity
689
+ num_blocks: 19
690
+ dropout_rate: 0.1
691
+ positional_dropout_rate: 0.1
692
+ attention_dropout_rate: 0.1
693
+ input_layer: null
694
+ layer_drop_rate: 0.0
695
+ linear_units: 4096
696
+ positionwise_layer_type: linear
697
+ macaron_ffn: true
698
+ use_ffn: true
699
+ merge_conv_kernel: 31
700
+ model: espnet
701
+ model_conf: {}
702
+ required:
703
+ - output_dir
704
+ - token_list
705
+ version: '202412'
706
+ distributed: false
exp/kmeans/xeus_18_5000clusters/km_5000.mdl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9954425d38ea74b0fed2ea2a26a70406ef34441c8a643284e02a3bc73320fbd9
3
+ size 20500858
exp/kmeans/xeus_18_5000clusters/logdir/learn_kmeans.log ADDED
The diff for this file is too large to render. See raw diff
 
exp/kmeans/xeus_18_5000clusters/train.scp ADDED
The diff for this file is too large to render. See raw diff