Shikhar Bharadwaj committed on
Commit
25042ab
·
1 Parent(s): 2036284

Update model

Browse files
Files changed (24) hide show
  1. README.md +1263 -0
  2. meta.yaml +8 -0
  3. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/config.yaml +1206 -0
  4. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/epoch_latest.pt +3 -0
  5. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/acc.png +0 -0
  6. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/acc_mask.png +0 -0
  7. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/acc_unmask.png +0 -0
  8. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/count_masked.png +0 -0
  9. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/count_unmask.png +0 -0
  10. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/entropy.png +0 -0
  11. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/gpu_max_cached_mem_GB.png +0 -0
  12. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/grad_norm.png +0 -0
  13. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/iter_time.png +0 -0
  14. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/learning_rate.png +0 -0
  15. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/loss.png +0 -0
  16. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/loss_scale.png +0 -0
  17. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_pred.png +0 -0
  18. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_pred_msk.png +0 -0
  19. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_pred_unmsk.png +0 -0
  20. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_tgt.png +0 -0
  21. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_tgt_msk.png +0 -0
  22. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/step_time.png +0 -0
  23. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/vocab_cov_pred.png +0 -0
  24. work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/vocab_cov_tgt.png +0 -0
README.md ADDED
@@ -0,0 +1,1263 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - espnet
4
+ - audio
5
+ - self-supervised-learning
6
+ datasets:
7
+ - as2m
8
+ license: cc-by-4.0
9
+ ---
10
+
11
+ ## ESPnet2 SSL model
12
+
13
+ ### `shikhar7ssu/OpenBEATs-Large-i3`
14
+
15
+ This model was trained by Shikhar Bharadwaj using the as2m recipe in [espnet](https://github.com/espnet/espnet/).
16
+
17
+ ## SSL config
18
+
19
+ <details><summary>expand</summary>
20
+
21
+ ```
22
+ config: conf/ear_large.yaml
23
+ print_config: false
24
+ log_level: INFO
25
+ drop_last_iter: false
26
+ dry_run: false
27
+ iterator_type: sequence
28
+ valid_iterator_type: null
29
+ output_dir: /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000
30
+ ngpu: 1
31
+ seed: 0
32
+ num_workers: 4
33
+ num_att_plot: 0
34
+ dist_backend: nccl
35
+ dist_init_method: env://
36
+ dist_world_size: 4
37
+ dist_rank: 0
38
+ local_rank: 0
39
+ dist_master_addr: localhost
40
+ dist_master_port: 60649
41
+ dist_launcher: null
42
+ multiprocessing_distributed: true
43
+ unused_parameters: false
44
+ sharded_ddp: false
45
+ use_deepspeed: true
46
+ deepspeed_config: ewogICJ0cmFpbl9taWNyb19iYXRjaF9zaXplX3Blcl9ncHUiOiAxLAogICJncmFkaWVudF9hY2N1bXVsYXRpb25fc3RlcHMiOiAxLAogICJncmFkaWVudF9jbGlwcGluZyI6IDEuMCwKICAiYmYxNiI6IHsKICAgICJlbmFibGVkIjogdHJ1ZQogIH0sCiAgIm9wdGltaXplciI6IHsKICAgICJ0eXBlIjogIkFkYW0iLAogICAgInBhcmFtcyI6IHsKICAgICAgImxyIjogMS4wZS00LAogICAgICAiYmV0YXMiOiBbMC45LCAwLjk4XSwKICAgICAgImVwcyI6IDFlLTEyLAogICAgICAid2VpZ2h0X2RlY2F5IjogMS4wZS0yLAogICAgICAiYWRhbV93X21vZGUiOiB0cnVlCiAgICB9CiAgfSwKICAic2NoZWR1bGVyIjogewogICAgInR5cGUiOiAiV2FybXVwRGVjYXlMUiIsCiAgICAicGFyYW1zIjogewogICAgICAid2FybXVwX3R5cGUiOiAibGluZWFyIiwKICAgICAgInRvdGFsX251bV9zdGVwcyI6IDQwMDAwMCwKICAgICAgIndhcm11cF9udW1fc3RlcHMiOiA0MDAwMCwKICAgICAgIndhcm11cF9tYXhfbHIiOiAxLjBlLTQsCiAgICAgICJ3YXJtdXBfbWluX2xyIjogMS4wZS02CiAgICB9CiAgfSwKICAid2FsbF9jbG9ja19icmVha2Rvd24iOiBmYWxzZSwKICAic3RlcHNfcGVyX3ByaW50IjogMzAwMAp9Cg==
47
+ gradient_as_bucket_view: true
48
+ ddp_comm_hook: null
49
+ cudnn_enabled: true
50
+ cudnn_benchmark: false
51
+ cudnn_deterministic: true
52
+ use_tf32: false
53
+ collect_stats: false
54
+ write_collected_feats: false
55
+ max_epoch: 59
56
+ patience: null
57
+ val_scheduler_criterion:
58
+ - valid
59
+ - loss
60
+ early_stopping_criterion:
61
+ - valid
62
+ - loss
63
+ - min
64
+ best_model_criterion:
65
+ - - train
66
+ - loss
67
+ - min
68
+ - - valid
69
+ - loss
70
+ - min
71
+ - - train
72
+ - acc
73
+ - max
74
+ - - valid
75
+ - acc
76
+ - max
77
+ keep_nbest_models:
78
+ - 10
79
+ nbest_averaging_interval: 0
80
+ grad_clip: 5.0
81
+ grad_clip_type: 2.0
82
+ grad_noise: false
83
+ accum_grad: 1
84
+ no_forward_run: false
85
+ resume: true
86
+ train_dtype: float32
87
+ use_amp: false
88
+ log_interval: null
89
+ use_matplotlib: true
90
+ use_tensorboard: true
91
+ create_graph_in_tensorboard: false
92
+ use_wandb: true
93
+ wandb_project: EARlarge.PT
94
+ wandb_id: null
95
+ wandb_entity: shikhar
96
+ wandb_name: large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000
97
+ wandb_model_log_interval: -1
98
+ detect_anomaly: false
99
+ use_adapter: false
100
+ adapter: lora
101
+ save_strategy: all
102
+ adapter_conf: {}
103
+ pretrain_path: null
104
+ init_param: []
105
+ ignore_init_mismatch: false
106
+ freeze_param: []
107
+ num_iters_per_epoch: null
108
+ batch_size: 20
109
+ valid_batch_size: null
110
+ batch_bins: 1600000
111
+ valid_batch_bins: null
112
+ category_sample_size: 10
113
+ train_shape_file:
114
+ - /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_stats_fbank/train/speech_shape
115
+ - /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_stats_fbank/train/target_shape.word
116
+ valid_shape_file:
117
+ - /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_stats_fbank/valid/speech_shape
118
+ - /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_stats_fbank/valid/target_shape.word
119
+ batch_type: length
120
+ valid_batch_type: null
121
+ fold_length:
122
+ - 160000
123
+ - 600
124
+ sort_in_batch: descending
125
+ shuffle_within_batch: false
126
+ sort_batch: descending
127
+ multiple_iterator: false
128
+ utt2weight_file: null
129
+ chunk_length: 500
130
+ chunk_shift_ratio: 0.5
131
+ num_cache_chunks: 1024
132
+ chunk_excluded_key_prefixes: []
133
+ chunk_default_fs: null
134
+ chunk_max_abs_length: null
135
+ chunk_discard_short_samples: true
136
+ train_data_path_and_name_and_type:
137
+ - - /work/nvme/bbjs/sbharadwaj/7Msounds/dump/fbank/train/feats.scp
138
+ - speech
139
+ - kaldi_ark
140
+ - - /work/nvme/bbjs/sbharadwaj/7Msounds/dump/fbank/train/target_iter2_tokenizer_large_100k_steps
141
+ - target
142
+ - text
143
+ valid_data_path_and_name_and_type:
144
+ - - /work/nvme/bbjs/sbharadwaj/7Msounds/dump/fbank/eval/feats.scp
145
+ - speech
146
+ - kaldi_ark
147
+ - - /work/nvme/bbjs/sbharadwaj/7Msounds/dump/fbank/eval/target_iter2_tokenizer_large_100k_steps
148
+ - target
149
+ - text
150
+ multi_task_dataset: false
151
+ allow_variable_data_keys: false
152
+ max_cache_size: 0.0
153
+ max_cache_fd: 32
154
+ allow_multi_rates: false
155
+ valid_max_cache_size: null
156
+ exclude_weight_decay: false
157
+ exclude_weight_decay_conf: {}
158
+ optim: adadelta
159
+ optim_conf: {}
160
+ scheduler: null
161
+ scheduler_conf: {}
162
+ lightning_conf: {}
163
+ token_list:
164
+ - <unk>
165
+ - '0'
166
+ - '1'
167
+ - '2'
168
+ - '3'
169
+ - '4'
170
+ - '5'
171
+ - '6'
172
+ - '7'
173
+ - '8'
174
+ - '9'
175
+ - '10'
176
+ - '11'
177
+ - '12'
178
+ - '13'
179
+ - '14'
180
+ - '15'
181
+ - '16'
182
+ - '17'
183
+ - '18'
184
+ - '19'
185
+ - '20'
186
+ - '21'
187
+ - '22'
188
+ - '23'
189
+ - '24'
190
+ - '25'
191
+ - '26'
192
+ - '27'
193
+ - '28'
194
+ - '29'
195
+ - '30'
196
+ - '31'
197
+ - '32'
198
+ - '33'
199
+ - '34'
200
+ - '35'
201
+ - '36'
202
+ - '37'
203
+ - '38'
204
+ - '39'
205
+ - '40'
206
+ - '41'
207
+ - '42'
208
+ - '43'
209
+ - '44'
210
+ - '45'
211
+ - '46'
212
+ - '47'
213
+ - '48'
214
+ - '49'
215
+ - '50'
216
+ - '51'
217
+ - '52'
218
+ - '53'
219
+ - '54'
220
+ - '55'
221
+ - '56'
222
+ - '57'
223
+ - '58'
224
+ - '59'
225
+ - '60'
226
+ - '61'
227
+ - '62'
228
+ - '63'
229
+ - '64'
230
+ - '65'
231
+ - '66'
232
+ - '67'
233
+ - '68'
234
+ - '69'
235
+ - '70'
236
+ - '71'
237
+ - '72'
238
+ - '73'
239
+ - '74'
240
+ - '75'
241
+ - '76'
242
+ - '77'
243
+ - '78'
244
+ - '79'
245
+ - '80'
246
+ - '81'
247
+ - '82'
248
+ - '83'
249
+ - '84'
250
+ - '85'
251
+ - '86'
252
+ - '87'
253
+ - '88'
254
+ - '89'
255
+ - '90'
256
+ - '91'
257
+ - '92'
258
+ - '93'
259
+ - '94'
260
+ - '95'
261
+ - '96'
262
+ - '97'
263
+ - '98'
264
+ - '99'
265
+ - '100'
266
+ - '101'
267
+ - '102'
268
+ - '103'
269
+ - '104'
270
+ - '105'
271
+ - '106'
272
+ - '107'
273
+ - '108'
274
+ - '109'
275
+ - '110'
276
+ - '111'
277
+ - '112'
278
+ - '113'
279
+ - '114'
280
+ - '115'
281
+ - '116'
282
+ - '117'
283
+ - '118'
284
+ - '119'
285
+ - '120'
286
+ - '121'
287
+ - '122'
288
+ - '123'
289
+ - '124'
290
+ - '125'
291
+ - '126'
292
+ - '127'
293
+ - '128'
294
+ - '129'
295
+ - '130'
296
+ - '131'
297
+ - '132'
298
+ - '133'
299
+ - '134'
300
+ - '135'
301
+ - '136'
302
+ - '137'
303
+ - '138'
304
+ - '139'
305
+ - '140'
306
+ - '141'
307
+ - '142'
308
+ - '143'
309
+ - '144'
310
+ - '145'
311
+ - '146'
312
+ - '147'
313
+ - '148'
314
+ - '149'
315
+ - '150'
316
+ - '151'
317
+ - '152'
318
+ - '153'
319
+ - '154'
320
+ - '155'
321
+ - '156'
322
+ - '157'
323
+ - '158'
324
+ - '159'
325
+ - '160'
326
+ - '161'
327
+ - '162'
328
+ - '163'
329
+ - '164'
330
+ - '165'
331
+ - '166'
332
+ - '167'
333
+ - '168'
334
+ - '169'
335
+ - '170'
336
+ - '171'
337
+ - '172'
338
+ - '173'
339
+ - '174'
340
+ - '175'
341
+ - '176'
342
+ - '177'
343
+ - '178'
344
+ - '179'
345
+ - '180'
346
+ - '181'
347
+ - '182'
348
+ - '183'
349
+ - '184'
350
+ - '185'
351
+ - '186'
352
+ - '187'
353
+ - '188'
354
+ - '189'
355
+ - '190'
356
+ - '191'
357
+ - '192'
358
+ - '193'
359
+ - '194'
360
+ - '195'
361
+ - '196'
362
+ - '197'
363
+ - '198'
364
+ - '199'
365
+ - '200'
366
+ - '201'
367
+ - '202'
368
+ - '203'
369
+ - '204'
370
+ - '205'
371
+ - '206'
372
+ - '207'
373
+ - '208'
374
+ - '209'
375
+ - '210'
376
+ - '211'
377
+ - '212'
378
+ - '213'
379
+ - '214'
380
+ - '215'
381
+ - '216'
382
+ - '217'
383
+ - '218'
384
+ - '219'
385
+ - '220'
386
+ - '221'
387
+ - '222'
388
+ - '223'
389
+ - '224'
390
+ - '225'
391
+ - '226'
392
+ - '227'
393
+ - '228'
394
+ - '229'
395
+ - '230'
396
+ - '231'
397
+ - '232'
398
+ - '233'
399
+ - '234'
400
+ - '235'
401
+ - '236'
402
+ - '237'
403
+ - '238'
404
+ - '239'
405
+ - '240'
406
+ - '241'
407
+ - '242'
408
+ - '243'
409
+ - '244'
410
+ - '245'
411
+ - '246'
412
+ - '247'
413
+ - '248'
414
+ - '249'
415
+ - '250'
416
+ - '251'
417
+ - '252'
418
+ - '253'
419
+ - '254'
420
+ - '255'
421
+ - '256'
422
+ - '257'
423
+ - '258'
424
+ - '259'
425
+ - '260'
426
+ - '261'
427
+ - '262'
428
+ - '263'
429
+ - '264'
430
+ - '265'
431
+ - '266'
432
+ - '267'
433
+ - '268'
434
+ - '269'
435
+ - '270'
436
+ - '271'
437
+ - '272'
438
+ - '273'
439
+ - '274'
440
+ - '275'
441
+ - '276'
442
+ - '277'
443
+ - '278'
444
+ - '279'
445
+ - '280'
446
+ - '281'
447
+ - '282'
448
+ - '283'
449
+ - '284'
450
+ - '285'
451
+ - '286'
452
+ - '287'
453
+ - '288'
454
+ - '289'
455
+ - '290'
456
+ - '291'
457
+ - '292'
458
+ - '293'
459
+ - '294'
460
+ - '295'
461
+ - '296'
462
+ - '297'
463
+ - '298'
464
+ - '299'
465
+ - '300'
466
+ - '301'
467
+ - '302'
468
+ - '303'
469
+ - '304'
470
+ - '305'
471
+ - '306'
472
+ - '307'
473
+ - '308'
474
+ - '309'
475
+ - '310'
476
+ - '311'
477
+ - '312'
478
+ - '313'
479
+ - '314'
480
+ - '315'
481
+ - '316'
482
+ - '317'
483
+ - '318'
484
+ - '319'
485
+ - '320'
486
+ - '321'
487
+ - '322'
488
+ - '323'
489
+ - '324'
490
+ - '325'
491
+ - '326'
492
+ - '327'
493
+ - '328'
494
+ - '329'
495
+ - '330'
496
+ - '331'
497
+ - '332'
498
+ - '333'
499
+ - '334'
500
+ - '335'
501
+ - '336'
502
+ - '337'
503
+ - '338'
504
+ - '339'
505
+ - '340'
506
+ - '341'
507
+ - '342'
508
+ - '343'
509
+ - '344'
510
+ - '345'
511
+ - '346'
512
+ - '347'
513
+ - '348'
514
+ - '349'
515
+ - '350'
516
+ - '351'
517
+ - '352'
518
+ - '353'
519
+ - '354'
520
+ - '355'
521
+ - '356'
522
+ - '357'
523
+ - '358'
524
+ - '359'
525
+ - '360'
526
+ - '361'
527
+ - '362'
528
+ - '363'
529
+ - '364'
530
+ - '365'
531
+ - '366'
532
+ - '367'
533
+ - '368'
534
+ - '369'
535
+ - '370'
536
+ - '371'
537
+ - '372'
538
+ - '373'
539
+ - '374'
540
+ - '375'
541
+ - '376'
542
+ - '377'
543
+ - '378'
544
+ - '379'
545
+ - '380'
546
+ - '381'
547
+ - '382'
548
+ - '383'
549
+ - '384'
550
+ - '385'
551
+ - '386'
552
+ - '387'
553
+ - '388'
554
+ - '389'
555
+ - '390'
556
+ - '391'
557
+ - '392'
558
+ - '393'
559
+ - '394'
560
+ - '395'
561
+ - '396'
562
+ - '397'
563
+ - '398'
564
+ - '399'
565
+ - '400'
566
+ - '401'
567
+ - '402'
568
+ - '403'
569
+ - '404'
570
+ - '405'
571
+ - '406'
572
+ - '407'
573
+ - '408'
574
+ - '409'
575
+ - '410'
576
+ - '411'
577
+ - '412'
578
+ - '413'
579
+ - '414'
580
+ - '415'
581
+ - '416'
582
+ - '417'
583
+ - '418'
584
+ - '419'
585
+ - '420'
586
+ - '421'
587
+ - '422'
588
+ - '423'
589
+ - '424'
590
+ - '425'
591
+ - '426'
592
+ - '427'
593
+ - '428'
594
+ - '429'
595
+ - '430'
596
+ - '431'
597
+ - '432'
598
+ - '433'
599
+ - '434'
600
+ - '435'
601
+ - '436'
602
+ - '437'
603
+ - '438'
604
+ - '439'
605
+ - '440'
606
+ - '441'
607
+ - '442'
608
+ - '443'
609
+ - '444'
610
+ - '445'
611
+ - '446'
612
+ - '447'
613
+ - '448'
614
+ - '449'
615
+ - '450'
616
+ - '451'
617
+ - '452'
618
+ - '453'
619
+ - '454'
620
+ - '455'
621
+ - '456'
622
+ - '457'
623
+ - '458'
624
+ - '459'
625
+ - '460'
626
+ - '461'
627
+ - '462'
628
+ - '463'
629
+ - '464'
630
+ - '465'
631
+ - '466'
632
+ - '467'
633
+ - '468'
634
+ - '469'
635
+ - '470'
636
+ - '471'
637
+ - '472'
638
+ - '473'
639
+ - '474'
640
+ - '475'
641
+ - '476'
642
+ - '477'
643
+ - '478'
644
+ - '479'
645
+ - '480'
646
+ - '481'
647
+ - '482'
648
+ - '483'
649
+ - '484'
650
+ - '485'
651
+ - '486'
652
+ - '487'
653
+ - '488'
654
+ - '489'
655
+ - '490'
656
+ - '491'
657
+ - '492'
658
+ - '493'
659
+ - '494'
660
+ - '495'
661
+ - '496'
662
+ - '497'
663
+ - '498'
664
+ - '499'
665
+ - '500'
666
+ - '501'
667
+ - '502'
668
+ - '503'
669
+ - '504'
670
+ - '505'
671
+ - '506'
672
+ - '507'
673
+ - '508'
674
+ - '509'
675
+ - '510'
676
+ - '511'
677
+ - '512'
678
+ - '513'
679
+ - '514'
680
+ - '515'
681
+ - '516'
682
+ - '517'
683
+ - '518'
684
+ - '519'
685
+ - '520'
686
+ - '521'
687
+ - '522'
688
+ - '523'
689
+ - '524'
690
+ - '525'
691
+ - '526'
692
+ - '527'
693
+ - '528'
694
+ - '529'
695
+ - '530'
696
+ - '531'
697
+ - '532'
698
+ - '533'
699
+ - '534'
700
+ - '535'
701
+ - '536'
702
+ - '537'
703
+ - '538'
704
+ - '539'
705
+ - '540'
706
+ - '541'
707
+ - '542'
708
+ - '543'
709
+ - '544'
710
+ - '545'
711
+ - '546'
712
+ - '547'
713
+ - '548'
714
+ - '549'
715
+ - '550'
716
+ - '551'
717
+ - '552'
718
+ - '553'
719
+ - '554'
720
+ - '555'
721
+ - '556'
722
+ - '557'
723
+ - '558'
724
+ - '559'
725
+ - '560'
726
+ - '561'
727
+ - '562'
728
+ - '563'
729
+ - '564'
730
+ - '565'
731
+ - '566'
732
+ - '567'
733
+ - '568'
734
+ - '569'
735
+ - '570'
736
+ - '571'
737
+ - '572'
738
+ - '573'
739
+ - '574'
740
+ - '575'
741
+ - '576'
742
+ - '577'
743
+ - '578'
744
+ - '579'
745
+ - '580'
746
+ - '581'
747
+ - '582'
748
+ - '583'
749
+ - '584'
750
+ - '585'
751
+ - '586'
752
+ - '587'
753
+ - '588'
754
+ - '589'
755
+ - '590'
756
+ - '591'
757
+ - '592'
758
+ - '593'
759
+ - '594'
760
+ - '595'
761
+ - '596'
762
+ - '597'
763
+ - '598'
764
+ - '599'
765
+ - '600'
766
+ - '601'
767
+ - '602'
768
+ - '603'
769
+ - '604'
770
+ - '605'
771
+ - '606'
772
+ - '607'
773
+ - '608'
774
+ - '609'
775
+ - '610'
776
+ - '611'
777
+ - '612'
778
+ - '613'
779
+ - '614'
780
+ - '615'
781
+ - '616'
782
+ - '617'
783
+ - '618'
784
+ - '619'
785
+ - '620'
786
+ - '621'
787
+ - '622'
788
+ - '623'
789
+ - '624'
790
+ - '625'
791
+ - '626'
792
+ - '627'
793
+ - '628'
794
+ - '629'
795
+ - '630'
796
+ - '631'
797
+ - '632'
798
+ - '633'
799
+ - '634'
800
+ - '635'
801
+ - '636'
802
+ - '637'
803
+ - '638'
804
+ - '639'
805
+ - '640'
806
+ - '641'
807
+ - '642'
808
+ - '643'
809
+ - '644'
810
+ - '645'
811
+ - '646'
812
+ - '647'
813
+ - '648'
814
+ - '649'
815
+ - '650'
816
+ - '651'
817
+ - '652'
818
+ - '653'
819
+ - '654'
820
+ - '655'
821
+ - '656'
822
+ - '657'
823
+ - '658'
824
+ - '659'
825
+ - '660'
826
+ - '661'
827
+ - '662'
828
+ - '663'
829
+ - '664'
830
+ - '665'
831
+ - '666'
832
+ - '667'
833
+ - '668'
834
+ - '669'
835
+ - '670'
836
+ - '671'
837
+ - '672'
838
+ - '673'
839
+ - '674'
840
+ - '675'
841
+ - '676'
842
+ - '677'
843
+ - '678'
844
+ - '679'
845
+ - '680'
846
+ - '681'
847
+ - '682'
848
+ - '683'
849
+ - '684'
850
+ - '685'
851
+ - '686'
852
+ - '687'
853
+ - '688'
854
+ - '689'
855
+ - '690'
856
+ - '691'
857
+ - '692'
858
+ - '693'
859
+ - '694'
860
+ - '695'
861
+ - '696'
862
+ - '697'
863
+ - '698'
864
+ - '699'
865
+ - '700'
866
+ - '701'
867
+ - '702'
868
+ - '703'
869
+ - '704'
870
+ - '705'
871
+ - '706'
872
+ - '707'
873
+ - '708'
874
+ - '709'
875
+ - '710'
876
+ - '711'
877
+ - '712'
878
+ - '713'
879
+ - '714'
880
+ - '715'
881
+ - '716'
882
+ - '717'
883
+ - '718'
884
+ - '719'
885
+ - '720'
886
+ - '721'
887
+ - '722'
888
+ - '723'
889
+ - '724'
890
+ - '725'
891
+ - '726'
892
+ - '727'
893
+ - '728'
894
+ - '729'
895
+ - '730'
896
+ - '731'
897
+ - '732'
898
+ - '733'
899
+ - '734'
900
+ - '735'
901
+ - '736'
902
+ - '737'
903
+ - '738'
904
+ - '739'
905
+ - '740'
906
+ - '741'
907
+ - '742'
908
+ - '743'
909
+ - '744'
910
+ - '745'
911
+ - '746'
912
+ - '747'
913
+ - '748'
914
+ - '749'
915
+ - '750'
916
+ - '751'
917
+ - '752'
918
+ - '753'
919
+ - '754'
920
+ - '755'
921
+ - '756'
922
+ - '757'
923
+ - '758'
924
+ - '759'
925
+ - '760'
926
+ - '761'
927
+ - '762'
928
+ - '763'
929
+ - '764'
930
+ - '765'
931
+ - '766'
932
+ - '767'
933
+ - '768'
934
+ - '769'
935
+ - '770'
936
+ - '771'
937
+ - '772'
938
+ - '773'
939
+ - '774'
940
+ - '775'
941
+ - '776'
942
+ - '777'
943
+ - '778'
944
+ - '779'
945
+ - '780'
946
+ - '781'
947
+ - '782'
948
+ - '783'
949
+ - '784'
950
+ - '785'
951
+ - '786'
952
+ - '787'
953
+ - '788'
954
+ - '789'
955
+ - '790'
956
+ - '791'
957
+ - '792'
958
+ - '793'
959
+ - '794'
960
+ - '795'
961
+ - '796'
962
+ - '797'
963
+ - '798'
964
+ - '799'
965
+ - '800'
966
+ - '801'
967
+ - '802'
968
+ - '803'
969
+ - '804'
970
+ - '805'
971
+ - '806'
972
+ - '807'
973
+ - '808'
974
+ - '809'
975
+ - '810'
976
+ - '811'
977
+ - '812'
978
+ - '813'
979
+ - '814'
980
+ - '815'
981
+ - '816'
982
+ - '817'
983
+ - '818'
984
+ - '819'
985
+ - '820'
986
+ - '821'
987
+ - '822'
988
+ - '823'
989
+ - '824'
990
+ - '825'
991
+ - '826'
992
+ - '827'
993
+ - '828'
994
+ - '829'
995
+ - '830'
996
+ - '831'
997
+ - '832'
998
+ - '833'
999
+ - '834'
1000
+ - '835'
1001
+ - '836'
1002
+ - '837'
1003
+ - '838'
1004
+ - '839'
1005
+ - '840'
1006
+ - '841'
1007
+ - '842'
1008
+ - '843'
1009
+ - '844'
1010
+ - '845'
1011
+ - '846'
1012
+ - '847'
1013
+ - '848'
1014
+ - '849'
1015
+ - '850'
1016
+ - '851'
1017
+ - '852'
1018
+ - '853'
1019
+ - '854'
1020
+ - '855'
1021
+ - '856'
1022
+ - '857'
1023
+ - '858'
1024
+ - '859'
1025
+ - '860'
1026
+ - '861'
1027
+ - '862'
1028
+ - '863'
1029
+ - '864'
1030
+ - '865'
1031
+ - '866'
1032
+ - '867'
1033
+ - '868'
1034
+ - '869'
1035
+ - '870'
1036
+ - '871'
1037
+ - '872'
1038
+ - '873'
1039
+ - '874'
1040
+ - '875'
1041
+ - '876'
1042
+ - '877'
1043
+ - '878'
1044
+ - '879'
1045
+ - '880'
1046
+ - '881'
1047
+ - '882'
1048
+ - '883'
1049
+ - '884'
1050
+ - '885'
1051
+ - '886'
1052
+ - '887'
1053
+ - '888'
1054
+ - '889'
1055
+ - '890'
1056
+ - '891'
1057
+ - '892'
1058
+ - '893'
1059
+ - '894'
1060
+ - '895'
1061
+ - '896'
1062
+ - '897'
1063
+ - '898'
1064
+ - '899'
1065
+ - '900'
1066
+ - '901'
1067
+ - '902'
1068
+ - '903'
1069
+ - '904'
1070
+ - '905'
1071
+ - '906'
1072
+ - '907'
1073
+ - '908'
1074
+ - '909'
1075
+ - '910'
1076
+ - '911'
1077
+ - '912'
1078
+ - '913'
1079
+ - '914'
1080
+ - '915'
1081
+ - '916'
1082
+ - '917'
1083
+ - '918'
1084
+ - '919'
1085
+ - '920'
1086
+ - '921'
1087
+ - '922'
1088
+ - '923'
1089
+ - '924'
1090
+ - '925'
1091
+ - '926'
1092
+ - '927'
1093
+ - '928'
1094
+ - '929'
1095
+ - '930'
1096
+ - '931'
1097
+ - '932'
1098
+ - '933'
1099
+ - '934'
1100
+ - '935'
1101
+ - '936'
1102
+ - '937'
1103
+ - '938'
1104
+ - '939'
1105
+ - '940'
1106
+ - '941'
1107
+ - '942'
1108
+ - '943'
1109
+ - '944'
1110
+ - '945'
1111
+ - '946'
1112
+ - '947'
1113
+ - '948'
1114
+ - '949'
1115
+ - '950'
1116
+ - '951'
1117
+ - '952'
1118
+ - '953'
1119
+ - '954'
1120
+ - '955'
1121
+ - '956'
1122
+ - '957'
1123
+ - '958'
1124
+ - '959'
1125
+ - '960'
1126
+ - '961'
1127
+ - '962'
1128
+ - '963'
1129
+ - '964'
1130
+ - '965'
1131
+ - '966'
1132
+ - '967'
1133
+ - '968'
1134
+ - '969'
1135
+ - '970'
1136
+ - '971'
1137
+ - '972'
1138
+ - '973'
1139
+ - '974'
1140
+ - '975'
1141
+ - '976'
1142
+ - '977'
1143
+ - '978'
1144
+ - '979'
1145
+ - '980'
1146
+ - '981'
1147
+ - '982'
1148
+ - '983'
1149
+ - '984'
1150
+ - '985'
1151
+ - '986'
1152
+ - '987'
1153
+ - '988'
1154
+ - '989'
1155
+ - '990'
1156
+ - '991'
1157
+ - '992'
1158
+ - '993'
1159
+ - '994'
1160
+ - '995'
1161
+ - '996'
1162
+ - '997'
1163
+ - '998'
1164
+ - '999'
1165
+ - '1000'
1166
+ - '1001'
1167
+ - '1002'
1168
+ - '1003'
1169
+ - '1004'
1170
+ - '1005'
1171
+ - '1006'
1172
+ - '1007'
1173
+ - '1008'
1174
+ - '1009'
1175
+ - '1010'
1176
+ - '1011'
1177
+ - '1012'
1178
+ - '1013'
1179
+ - '1014'
1180
+ - '1015'
1181
+ - '1016'
1182
+ - '1017'
1183
+ - '1018'
1184
+ - '1019'
1185
+ - '1020'
1186
+ - '1021'
1187
+ - '1022'
1188
+ - '1023'
1189
+ init: null
1190
+ collate_fn_conf: {}
1191
+ use_preprocessor: true
1192
+ waveform_input: false
1193
+ encoder: beats
1194
+ encoder_conf:
1195
+ use_weighted_representation: false
1196
+ is_pretraining: true
1197
+ beats_config:
1198
+ layer_wise_gradient_decay_ratio: 1.0
1199
+ encoder_layerdrop: 0.0
1200
+ dropout: 0.1
1201
+ codebook_vocab_size: 1024
1202
+ fbank_mean: 15.2913
1203
+ fbank_std: 5.90532
1204
+ decoder_layers: 3
1205
+ deep_norm: true
1206
+ use_flash_attn: false
1207
+ relative_position_embedding: true
1208
+ num_buckets: 320
1209
+ max_distance: 800
1210
+ gru_rel_pos: true
1211
+ encoder_layers: 24
1212
+ encoder_embed_dim: 1024
1213
+ encoder_ffn_embed_dim: 4096
1214
+ encoder_attention_heads: 16
1215
+ decoder_embed_dim: 1024
1216
+ decoder_attention_heads: 16
1217
+ model: beats
1218
+ model_conf:
1219
+ ignore_id: -2
1220
+ label_smoothing: 0.1
1221
+ waveform_input: false
1222
+ mixup_probability: 0.0
1223
+ required:
1224
+ - output_dir
1225
+ - token_list
1226
+ version: '202412'
1227
+ distributed: true
1228
+ ```
1229
+
1230
+ </details>
1231
+
1232
+ ### Citing ESPnet
1233
+
1234
+ ```bibtex
1235
+ @inproceedings{watanabe2018espnet,
1236
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
1237
+ title={{ESPnet}: End-to-End Speech Processing Toolkit},
1238
+ year={2018},
1239
+ booktitle={Proceedings of Interspeech},
1240
+ pages={2207--2211},
1241
+ doi={10.21437/Interspeech.2018-1456},
1242
+ url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
1243
+ }
1244
+
1245
+
1246
+
1247
+
1248
+
1249
+
1250
+ ```
1251
+
1252
+ or arXiv:
1253
+
1254
+ ```bibtex
1255
+ @misc{watanabe2018espnet,
1256
+ title={ESPnet: End-to-End Speech Processing Toolkit},
1257
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
1258
+ year={2018},
1259
+ eprint={1804.00015},
1260
+ archivePrefix={arXiv},
1261
+ primaryClass={cs.CL}
1262
+ }
1263
+ ```
meta.yaml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ espnet: '202503'
2
+ files:
3
+ ssl_model_file: /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/epoch_latest.pt
4
+ python: "3.9.18 | packaged by conda-forge | (main, Dec 23 2023, 17:20:25) \n[GCC 12.3.0]"
5
+ timestamp: 1752692937.535911
6
+ torch: 2.6.0.dev20241210+cu124
7
+ yaml_files:
8
+ ssl_train_config: /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/config.yaml
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/config.yaml ADDED
@@ -0,0 +1,1206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/ear_large.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000
9
+ ngpu: 1
10
+ seed: 0
11
+ num_workers: 4
12
+ num_att_plot: 0
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: 4
16
+ dist_rank: 0
17
+ local_rank: 0
18
+ dist_master_addr: localhost
19
+ dist_master_port: 60649
20
+ dist_launcher: null
21
+ multiprocessing_distributed: true
22
+ unused_parameters: false
23
+ sharded_ddp: false
24
+ use_deepspeed: true
25
+ deepspeed_config: ewogICJ0cmFpbl9taWNyb19iYXRjaF9zaXplX3Blcl9ncHUiOiAxLAogICJncmFkaWVudF9hY2N1bXVsYXRpb25fc3RlcHMiOiAxLAogICJncmFkaWVudF9jbGlwcGluZyI6IDEuMCwKICAiYmYxNiI6IHsKICAgICJlbmFibGVkIjogdHJ1ZQogIH0sCiAgIm9wdGltaXplciI6IHsKICAgICJ0eXBlIjogIkFkYW0iLAogICAgInBhcmFtcyI6IHsKICAgICAgImxyIjogMS4wZS00LAogICAgICAiYmV0YXMiOiBbMC45LCAwLjk4XSwKICAgICAgImVwcyI6IDFlLTEyLAogICAgICAid2VpZ2h0X2RlY2F5IjogMS4wZS0yLAogICAgICAiYWRhbV93X21vZGUiOiB0cnVlCiAgICB9CiAgfSwKICAic2NoZWR1bGVyIjogewogICAgInR5cGUiOiAiV2FybXVwRGVjYXlMUiIsCiAgICAicGFyYW1zIjogewogICAgICAid2FybXVwX3R5cGUiOiAibGluZWFyIiwKICAgICAgInRvdGFsX251bV9zdGVwcyI6IDQwMDAwMCwKICAgICAgIndhcm11cF9udW1fc3RlcHMiOiA0MDAwMCwKICAgICAgIndhcm11cF9tYXhfbHIiOiAxLjBlLTQsCiAgICAgICJ3YXJtdXBfbWluX2xyIjogMS4wZS02CiAgICB9CiAgfSwKICAid2FsbF9jbG9ja19icmVha2Rvd24iOiBmYWxzZSwKICAic3RlcHNfcGVyX3ByaW50IjogMzAwMAp9Cg==
26
+ gradient_as_bucket_view: true
27
+ ddp_comm_hook: null
28
+ cudnn_enabled: true
29
+ cudnn_benchmark: false
30
+ cudnn_deterministic: true
31
+ use_tf32: false
32
+ collect_stats: false
33
+ write_collected_feats: false
34
+ max_epoch: 59
35
+ patience: null
36
+ val_scheduler_criterion:
37
+ - valid
38
+ - loss
39
+ early_stopping_criterion:
40
+ - valid
41
+ - loss
42
+ - min
43
+ best_model_criterion:
44
+ - - train
45
+ - loss
46
+ - min
47
+ - - valid
48
+ - loss
49
+ - min
50
+ - - train
51
+ - acc
52
+ - max
53
+ - - valid
54
+ - acc
55
+ - max
56
+ keep_nbest_models:
57
+ - 10
58
+ nbest_averaging_interval: 0
59
+ grad_clip: 5.0
60
+ grad_clip_type: 2.0
61
+ grad_noise: false
62
+ accum_grad: 1
63
+ no_forward_run: false
64
+ resume: true
65
+ train_dtype: float32
66
+ use_amp: false
67
+ log_interval: null
68
+ use_matplotlib: true
69
+ use_tensorboard: true
70
+ create_graph_in_tensorboard: false
71
+ use_wandb: true
72
+ wandb_project: EARlarge.PT
73
+ wandb_id: null
74
+ wandb_entity: shikhar
75
+ wandb_name: large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000
76
+ wandb_model_log_interval: -1
77
+ detect_anomaly: false
78
+ use_adapter: false
79
+ adapter: lora
80
+ save_strategy: all
81
+ adapter_conf: {}
82
+ pretrain_path: null
83
+ init_param: []
84
+ ignore_init_mismatch: false
85
+ freeze_param: []
86
+ num_iters_per_epoch: null
87
+ batch_size: 20
88
+ valid_batch_size: null
89
+ batch_bins: 1600000
90
+ valid_batch_bins: null
91
+ category_sample_size: 10
92
+ train_shape_file:
93
+ - /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_stats_fbank/train/speech_shape
94
+ - /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_stats_fbank/train/target_shape.word
95
+ valid_shape_file:
96
+ - /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_stats_fbank/valid/speech_shape
97
+ - /work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_stats_fbank/valid/target_shape.word
98
+ batch_type: length
99
+ valid_batch_type: null
100
+ fold_length:
101
+ - 160000
102
+ - 600
103
+ sort_in_batch: descending
104
+ shuffle_within_batch: false
105
+ sort_batch: descending
106
+ multiple_iterator: false
107
+ utt2weight_file: null
108
+ chunk_length: 500
109
+ chunk_shift_ratio: 0.5
110
+ num_cache_chunks: 1024
111
+ chunk_excluded_key_prefixes: []
112
+ chunk_default_fs: null
113
+ chunk_max_abs_length: null
114
+ chunk_discard_short_samples: true
115
+ train_data_path_and_name_and_type:
116
+ - - /work/nvme/bbjs/sbharadwaj/7Msounds/dump/fbank/train/feats.scp
117
+ - speech
118
+ - kaldi_ark
119
+ - - /work/nvme/bbjs/sbharadwaj/7Msounds/dump/fbank/train/target_iter2_tokenizer_large_100k_steps
120
+ - target
121
+ - text
122
+ valid_data_path_and_name_and_type:
123
+ - - /work/nvme/bbjs/sbharadwaj/7Msounds/dump/fbank/eval/feats.scp
124
+ - speech
125
+ - kaldi_ark
126
+ - - /work/nvme/bbjs/sbharadwaj/7Msounds/dump/fbank/eval/target_iter2_tokenizer_large_100k_steps
127
+ - target
128
+ - text
129
+ multi_task_dataset: false
130
+ allow_variable_data_keys: false
131
+ max_cache_size: 0.0
132
+ max_cache_fd: 32
133
+ allow_multi_rates: false
134
+ valid_max_cache_size: null
135
+ exclude_weight_decay: false
136
+ exclude_weight_decay_conf: {}
137
+ optim: adadelta
138
+ optim_conf: {}
139
+ scheduler: null
140
+ scheduler_conf: {}
141
+ lightning_conf: {}
142
+ token_list:
143
+ - <unk>
144
+ - '0'
145
+ - '1'
146
+ - '2'
147
+ - '3'
148
+ - '4'
149
+ - '5'
150
+ - '6'
151
+ - '7'
152
+ - '8'
153
+ - '9'
154
+ - '10'
155
+ - '11'
156
+ - '12'
157
+ - '13'
158
+ - '14'
159
+ - '15'
160
+ - '16'
161
+ - '17'
162
+ - '18'
163
+ - '19'
164
+ - '20'
165
+ - '21'
166
+ - '22'
167
+ - '23'
168
+ - '24'
169
+ - '25'
170
+ - '26'
171
+ - '27'
172
+ - '28'
173
+ - '29'
174
+ - '30'
175
+ - '31'
176
+ - '32'
177
+ - '33'
178
+ - '34'
179
+ - '35'
180
+ - '36'
181
+ - '37'
182
+ - '38'
183
+ - '39'
184
+ - '40'
185
+ - '41'
186
+ - '42'
187
+ - '43'
188
+ - '44'
189
+ - '45'
190
+ - '46'
191
+ - '47'
192
+ - '48'
193
+ - '49'
194
+ - '50'
195
+ - '51'
196
+ - '52'
197
+ - '53'
198
+ - '54'
199
+ - '55'
200
+ - '56'
201
+ - '57'
202
+ - '58'
203
+ - '59'
204
+ - '60'
205
+ - '61'
206
+ - '62'
207
+ - '63'
208
+ - '64'
209
+ - '65'
210
+ - '66'
211
+ - '67'
212
+ - '68'
213
+ - '69'
214
+ - '70'
215
+ - '71'
216
+ - '72'
217
+ - '73'
218
+ - '74'
219
+ - '75'
220
+ - '76'
221
+ - '77'
222
+ - '78'
223
+ - '79'
224
+ - '80'
225
+ - '81'
226
+ - '82'
227
+ - '83'
228
+ - '84'
229
+ - '85'
230
+ - '86'
231
+ - '87'
232
+ - '88'
233
+ - '89'
234
+ - '90'
235
+ - '91'
236
+ - '92'
237
+ - '93'
238
+ - '94'
239
+ - '95'
240
+ - '96'
241
+ - '97'
242
+ - '98'
243
+ - '99'
244
+ - '100'
245
+ - '101'
246
+ - '102'
247
+ - '103'
248
+ - '104'
249
+ - '105'
250
+ - '106'
251
+ - '107'
252
+ - '108'
253
+ - '109'
254
+ - '110'
255
+ - '111'
256
+ - '112'
257
+ - '113'
258
+ - '114'
259
+ - '115'
260
+ - '116'
261
+ - '117'
262
+ - '118'
263
+ - '119'
264
+ - '120'
265
+ - '121'
266
+ - '122'
267
+ - '123'
268
+ - '124'
269
+ - '125'
270
+ - '126'
271
+ - '127'
272
+ - '128'
273
+ - '129'
274
+ - '130'
275
+ - '131'
276
+ - '132'
277
+ - '133'
278
+ - '134'
279
+ - '135'
280
+ - '136'
281
+ - '137'
282
+ - '138'
283
+ - '139'
284
+ - '140'
285
+ - '141'
286
+ - '142'
287
+ - '143'
288
+ - '144'
289
+ - '145'
290
+ - '146'
291
+ - '147'
292
+ - '148'
293
+ - '149'
294
+ - '150'
295
+ - '151'
296
+ - '152'
297
+ - '153'
298
+ - '154'
299
+ - '155'
300
+ - '156'
301
+ - '157'
302
+ - '158'
303
+ - '159'
304
+ - '160'
305
+ - '161'
306
+ - '162'
307
+ - '163'
308
+ - '164'
309
+ - '165'
310
+ - '166'
311
+ - '167'
312
+ - '168'
313
+ - '169'
314
+ - '170'
315
+ - '171'
316
+ - '172'
317
+ - '173'
318
+ - '174'
319
+ - '175'
320
+ - '176'
321
+ - '177'
322
+ - '178'
323
+ - '179'
324
+ - '180'
325
+ - '181'
326
+ - '182'
327
+ - '183'
328
+ - '184'
329
+ - '185'
330
+ - '186'
331
+ - '187'
332
+ - '188'
333
+ - '189'
334
+ - '190'
335
+ - '191'
336
+ - '192'
337
+ - '193'
338
+ - '194'
339
+ - '195'
340
+ - '196'
341
+ - '197'
342
+ - '198'
343
+ - '199'
344
+ - '200'
345
+ - '201'
346
+ - '202'
347
+ - '203'
348
+ - '204'
349
+ - '205'
350
+ - '206'
351
+ - '207'
352
+ - '208'
353
+ - '209'
354
+ - '210'
355
+ - '211'
356
+ - '212'
357
+ - '213'
358
+ - '214'
359
+ - '215'
360
+ - '216'
361
+ - '217'
362
+ - '218'
363
+ - '219'
364
+ - '220'
365
+ - '221'
366
+ - '222'
367
+ - '223'
368
+ - '224'
369
+ - '225'
370
+ - '226'
371
+ - '227'
372
+ - '228'
373
+ - '229'
374
+ - '230'
375
+ - '231'
376
+ - '232'
377
+ - '233'
378
+ - '234'
379
+ - '235'
380
+ - '236'
381
+ - '237'
382
+ - '238'
383
+ - '239'
384
+ - '240'
385
+ - '241'
386
+ - '242'
387
+ - '243'
388
+ - '244'
389
+ - '245'
390
+ - '246'
391
+ - '247'
392
+ - '248'
393
+ - '249'
394
+ - '250'
395
+ - '251'
396
+ - '252'
397
+ - '253'
398
+ - '254'
399
+ - '255'
400
+ - '256'
401
+ - '257'
402
+ - '258'
403
+ - '259'
404
+ - '260'
405
+ - '261'
406
+ - '262'
407
+ - '263'
408
+ - '264'
409
+ - '265'
410
+ - '266'
411
+ - '267'
412
+ - '268'
413
+ - '269'
414
+ - '270'
415
+ - '271'
416
+ - '272'
417
+ - '273'
418
+ - '274'
419
+ - '275'
420
+ - '276'
421
+ - '277'
422
+ - '278'
423
+ - '279'
424
+ - '280'
425
+ - '281'
426
+ - '282'
427
+ - '283'
428
+ - '284'
429
+ - '285'
430
+ - '286'
431
+ - '287'
432
+ - '288'
433
+ - '289'
434
+ - '290'
435
+ - '291'
436
+ - '292'
437
+ - '293'
438
+ - '294'
439
+ - '295'
440
+ - '296'
441
+ - '297'
442
+ - '298'
443
+ - '299'
444
+ - '300'
445
+ - '301'
446
+ - '302'
447
+ - '303'
448
+ - '304'
449
+ - '305'
450
+ - '306'
451
+ - '307'
452
+ - '308'
453
+ - '309'
454
+ - '310'
455
+ - '311'
456
+ - '312'
457
+ - '313'
458
+ - '314'
459
+ - '315'
460
+ - '316'
461
+ - '317'
462
+ - '318'
463
+ - '319'
464
+ - '320'
465
+ - '321'
466
+ - '322'
467
+ - '323'
468
+ - '324'
469
+ - '325'
470
+ - '326'
471
+ - '327'
472
+ - '328'
473
+ - '329'
474
+ - '330'
475
+ - '331'
476
+ - '332'
477
+ - '333'
478
+ - '334'
479
+ - '335'
480
+ - '336'
481
+ - '337'
482
+ - '338'
483
+ - '339'
484
+ - '340'
485
+ - '341'
486
+ - '342'
487
+ - '343'
488
+ - '344'
489
+ - '345'
490
+ - '346'
491
+ - '347'
492
+ - '348'
493
+ - '349'
494
+ - '350'
495
+ - '351'
496
+ - '352'
497
+ - '353'
498
+ - '354'
499
+ - '355'
500
+ - '356'
501
+ - '357'
502
+ - '358'
503
+ - '359'
504
+ - '360'
505
+ - '361'
506
+ - '362'
507
+ - '363'
508
+ - '364'
509
+ - '365'
510
+ - '366'
511
+ - '367'
512
+ - '368'
513
+ - '369'
514
+ - '370'
515
+ - '371'
516
+ - '372'
517
+ - '373'
518
+ - '374'
519
+ - '375'
520
+ - '376'
521
+ - '377'
522
+ - '378'
523
+ - '379'
524
+ - '380'
525
+ - '381'
526
+ - '382'
527
+ - '383'
528
+ - '384'
529
+ - '385'
530
+ - '386'
531
+ - '387'
532
+ - '388'
533
+ - '389'
534
+ - '390'
535
+ - '391'
536
+ - '392'
537
+ - '393'
538
+ - '394'
539
+ - '395'
540
+ - '396'
541
+ - '397'
542
+ - '398'
543
+ - '399'
544
+ - '400'
545
+ - '401'
546
+ - '402'
547
+ - '403'
548
+ - '404'
549
+ - '405'
550
+ - '406'
551
+ - '407'
552
+ - '408'
553
+ - '409'
554
+ - '410'
555
+ - '411'
556
+ - '412'
557
+ - '413'
558
+ - '414'
559
+ - '415'
560
+ - '416'
561
+ - '417'
562
+ - '418'
563
+ - '419'
564
+ - '420'
565
+ - '421'
566
+ - '422'
567
+ - '423'
568
+ - '424'
569
+ - '425'
570
+ - '426'
571
+ - '427'
572
+ - '428'
573
+ - '429'
574
+ - '430'
575
+ - '431'
576
+ - '432'
577
+ - '433'
578
+ - '434'
579
+ - '435'
580
+ - '436'
581
+ - '437'
582
+ - '438'
583
+ - '439'
584
+ - '440'
585
+ - '441'
586
+ - '442'
587
+ - '443'
588
+ - '444'
589
+ - '445'
590
+ - '446'
591
+ - '447'
592
+ - '448'
593
+ - '449'
594
+ - '450'
595
+ - '451'
596
+ - '452'
597
+ - '453'
598
+ - '454'
599
+ - '455'
600
+ - '456'
601
+ - '457'
602
+ - '458'
603
+ - '459'
604
+ - '460'
605
+ - '461'
606
+ - '462'
607
+ - '463'
608
+ - '464'
609
+ - '465'
610
+ - '466'
611
+ - '467'
612
+ - '468'
613
+ - '469'
614
+ - '470'
615
+ - '471'
616
+ - '472'
617
+ - '473'
618
+ - '474'
619
+ - '475'
620
+ - '476'
621
+ - '477'
622
+ - '478'
623
+ - '479'
624
+ - '480'
625
+ - '481'
626
+ - '482'
627
+ - '483'
628
+ - '484'
629
+ - '485'
630
+ - '486'
631
+ - '487'
632
+ - '488'
633
+ - '489'
634
+ - '490'
635
+ - '491'
636
+ - '492'
637
+ - '493'
638
+ - '494'
639
+ - '495'
640
+ - '496'
641
+ - '497'
642
+ - '498'
643
+ - '499'
644
+ - '500'
645
+ - '501'
646
+ - '502'
647
+ - '503'
648
+ - '504'
649
+ - '505'
650
+ - '506'
651
+ - '507'
652
+ - '508'
653
+ - '509'
654
+ - '510'
655
+ - '511'
656
+ - '512'
657
+ - '513'
658
+ - '514'
659
+ - '515'
660
+ - '516'
661
+ - '517'
662
+ - '518'
663
+ - '519'
664
+ - '520'
665
+ - '521'
666
+ - '522'
667
+ - '523'
668
+ - '524'
669
+ - '525'
670
+ - '526'
671
+ - '527'
672
+ - '528'
673
+ - '529'
674
+ - '530'
675
+ - '531'
676
+ - '532'
677
+ - '533'
678
+ - '534'
679
+ - '535'
680
+ - '536'
681
+ - '537'
682
+ - '538'
683
+ - '539'
684
+ - '540'
685
+ - '541'
686
+ - '542'
687
+ - '543'
688
+ - '544'
689
+ - '545'
690
+ - '546'
691
+ - '547'
692
+ - '548'
693
+ - '549'
694
+ - '550'
695
+ - '551'
696
+ - '552'
697
+ - '553'
698
+ - '554'
699
+ - '555'
700
+ - '556'
701
+ - '557'
702
+ - '558'
703
+ - '559'
704
+ - '560'
705
+ - '561'
706
+ - '562'
707
+ - '563'
708
+ - '564'
709
+ - '565'
710
+ - '566'
711
+ - '567'
712
+ - '568'
713
+ - '569'
714
+ - '570'
715
+ - '571'
716
+ - '572'
717
+ - '573'
718
+ - '574'
719
+ - '575'
720
+ - '576'
721
+ - '577'
722
+ - '578'
723
+ - '579'
724
+ - '580'
725
+ - '581'
726
+ - '582'
727
+ - '583'
728
+ - '584'
729
+ - '585'
730
+ - '586'
731
+ - '587'
732
+ - '588'
733
+ - '589'
734
+ - '590'
735
+ - '591'
736
+ - '592'
737
+ - '593'
738
+ - '594'
739
+ - '595'
740
+ - '596'
741
+ - '597'
742
+ - '598'
743
+ - '599'
744
+ - '600'
745
+ - '601'
746
+ - '602'
747
+ - '603'
748
+ - '604'
749
+ - '605'
750
+ - '606'
751
+ - '607'
752
+ - '608'
753
+ - '609'
754
+ - '610'
755
+ - '611'
756
+ - '612'
757
+ - '613'
758
+ - '614'
759
+ - '615'
760
+ - '616'
761
+ - '617'
762
+ - '618'
763
+ - '619'
764
+ - '620'
765
+ - '621'
766
+ - '622'
767
+ - '623'
768
+ - '624'
769
+ - '625'
770
+ - '626'
771
+ - '627'
772
+ - '628'
773
+ - '629'
774
+ - '630'
775
+ - '631'
776
+ - '632'
777
+ - '633'
778
+ - '634'
779
+ - '635'
780
+ - '636'
781
+ - '637'
782
+ - '638'
783
+ - '639'
784
+ - '640'
785
+ - '641'
786
+ - '642'
787
+ - '643'
788
+ - '644'
789
+ - '645'
790
+ - '646'
791
+ - '647'
792
+ - '648'
793
+ - '649'
794
+ - '650'
795
+ - '651'
796
+ - '652'
797
+ - '653'
798
+ - '654'
799
+ - '655'
800
+ - '656'
801
+ - '657'
802
+ - '658'
803
+ - '659'
804
+ - '660'
805
+ - '661'
806
+ - '662'
807
+ - '663'
808
+ - '664'
809
+ - '665'
810
+ - '666'
811
+ - '667'
812
+ - '668'
813
+ - '669'
814
+ - '670'
815
+ - '671'
816
+ - '672'
817
+ - '673'
818
+ - '674'
819
+ - '675'
820
+ - '676'
821
+ - '677'
822
+ - '678'
823
+ - '679'
824
+ - '680'
825
+ - '681'
826
+ - '682'
827
+ - '683'
828
+ - '684'
829
+ - '685'
830
+ - '686'
831
+ - '687'
832
+ - '688'
833
+ - '689'
834
+ - '690'
835
+ - '691'
836
+ - '692'
837
+ - '693'
838
+ - '694'
839
+ - '695'
840
+ - '696'
841
+ - '697'
842
+ - '698'
843
+ - '699'
844
+ - '700'
845
+ - '701'
846
+ - '702'
847
+ - '703'
848
+ - '704'
849
+ - '705'
850
+ - '706'
851
+ - '707'
852
+ - '708'
853
+ - '709'
854
+ - '710'
855
+ - '711'
856
+ - '712'
857
+ - '713'
858
+ - '714'
859
+ - '715'
860
+ - '716'
861
+ - '717'
862
+ - '718'
863
+ - '719'
864
+ - '720'
865
+ - '721'
866
+ - '722'
867
+ - '723'
868
+ - '724'
869
+ - '725'
870
+ - '726'
871
+ - '727'
872
+ - '728'
873
+ - '729'
874
+ - '730'
875
+ - '731'
876
+ - '732'
877
+ - '733'
878
+ - '734'
879
+ - '735'
880
+ - '736'
881
+ - '737'
882
+ - '738'
883
+ - '739'
884
+ - '740'
885
+ - '741'
886
+ - '742'
887
+ - '743'
888
+ - '744'
889
+ - '745'
890
+ - '746'
891
+ - '747'
892
+ - '748'
893
+ - '749'
894
+ - '750'
895
+ - '751'
896
+ - '752'
897
+ - '753'
898
+ - '754'
899
+ - '755'
900
+ - '756'
901
+ - '757'
902
+ - '758'
903
+ - '759'
904
+ - '760'
905
+ - '761'
906
+ - '762'
907
+ - '763'
908
+ - '764'
909
+ - '765'
910
+ - '766'
911
+ - '767'
912
+ - '768'
913
+ - '769'
914
+ - '770'
915
+ - '771'
916
+ - '772'
917
+ - '773'
918
+ - '774'
919
+ - '775'
920
+ - '776'
921
+ - '777'
922
+ - '778'
923
+ - '779'
924
+ - '780'
925
+ - '781'
926
+ - '782'
927
+ - '783'
928
+ - '784'
929
+ - '785'
930
+ - '786'
931
+ - '787'
932
+ - '788'
933
+ - '789'
934
+ - '790'
935
+ - '791'
936
+ - '792'
937
+ - '793'
938
+ - '794'
939
+ - '795'
940
+ - '796'
941
+ - '797'
942
+ - '798'
943
+ - '799'
944
+ - '800'
945
+ - '801'
946
+ - '802'
947
+ - '803'
948
+ - '804'
949
+ - '805'
950
+ - '806'
951
+ - '807'
952
+ - '808'
953
+ - '809'
954
+ - '810'
955
+ - '811'
956
+ - '812'
957
+ - '813'
958
+ - '814'
959
+ - '815'
960
+ - '816'
961
+ - '817'
962
+ - '818'
963
+ - '819'
964
+ - '820'
965
+ - '821'
966
+ - '822'
967
+ - '823'
968
+ - '824'
969
+ - '825'
970
+ - '826'
971
+ - '827'
972
+ - '828'
973
+ - '829'
974
+ - '830'
975
+ - '831'
976
+ - '832'
977
+ - '833'
978
+ - '834'
979
+ - '835'
980
+ - '836'
981
+ - '837'
982
+ - '838'
983
+ - '839'
984
+ - '840'
985
+ - '841'
986
+ - '842'
987
+ - '843'
988
+ - '844'
989
+ - '845'
990
+ - '846'
991
+ - '847'
992
+ - '848'
993
+ - '849'
994
+ - '850'
995
+ - '851'
996
+ - '852'
997
+ - '853'
998
+ - '854'
999
+ - '855'
1000
+ - '856'
1001
+ - '857'
1002
+ - '858'
1003
+ - '859'
1004
+ - '860'
1005
+ - '861'
1006
+ - '862'
1007
+ - '863'
1008
+ - '864'
1009
+ - '865'
1010
+ - '866'
1011
+ - '867'
1012
+ - '868'
1013
+ - '869'
1014
+ - '870'
1015
+ - '871'
1016
+ - '872'
1017
+ - '873'
1018
+ - '874'
1019
+ - '875'
1020
+ - '876'
1021
+ - '877'
1022
+ - '878'
1023
+ - '879'
1024
+ - '880'
1025
+ - '881'
1026
+ - '882'
1027
+ - '883'
1028
+ - '884'
1029
+ - '885'
1030
+ - '886'
1031
+ - '887'
1032
+ - '888'
1033
+ - '889'
1034
+ - '890'
1035
+ - '891'
1036
+ - '892'
1037
+ - '893'
1038
+ - '894'
1039
+ - '895'
1040
+ - '896'
1041
+ - '897'
1042
+ - '898'
1043
+ - '899'
1044
+ - '900'
1045
+ - '901'
1046
+ - '902'
1047
+ - '903'
1048
+ - '904'
1049
+ - '905'
1050
+ - '906'
1051
+ - '907'
1052
+ - '908'
1053
+ - '909'
1054
+ - '910'
1055
+ - '911'
1056
+ - '912'
1057
+ - '913'
1058
+ - '914'
1059
+ - '915'
1060
+ - '916'
1061
+ - '917'
1062
+ - '918'
1063
+ - '919'
1064
+ - '920'
1065
+ - '921'
1066
+ - '922'
1067
+ - '923'
1068
+ - '924'
1069
+ - '925'
1070
+ - '926'
1071
+ - '927'
1072
+ - '928'
1073
+ - '929'
1074
+ - '930'
1075
+ - '931'
1076
+ - '932'
1077
+ - '933'
1078
+ - '934'
1079
+ - '935'
1080
+ - '936'
1081
+ - '937'
1082
+ - '938'
1083
+ - '939'
1084
+ - '940'
1085
+ - '941'
1086
+ - '942'
1087
+ - '943'
1088
+ - '944'
1089
+ - '945'
1090
+ - '946'
1091
+ - '947'
1092
+ - '948'
1093
+ - '949'
1094
+ - '950'
1095
+ - '951'
1096
+ - '952'
1097
+ - '953'
1098
+ - '954'
1099
+ - '955'
1100
+ - '956'
1101
+ - '957'
1102
+ - '958'
1103
+ - '959'
1104
+ - '960'
1105
+ - '961'
1106
+ - '962'
1107
+ - '963'
1108
+ - '964'
1109
+ - '965'
1110
+ - '966'
1111
+ - '967'
1112
+ - '968'
1113
+ - '969'
1114
+ - '970'
1115
+ - '971'
1116
+ - '972'
1117
+ - '973'
1118
+ - '974'
1119
+ - '975'
1120
+ - '976'
1121
+ - '977'
1122
+ - '978'
1123
+ - '979'
1124
+ - '980'
1125
+ - '981'
1126
+ - '982'
1127
+ - '983'
1128
+ - '984'
1129
+ - '985'
1130
+ - '986'
1131
+ - '987'
1132
+ - '988'
1133
+ - '989'
1134
+ - '990'
1135
+ - '991'
1136
+ - '992'
1137
+ - '993'
1138
+ - '994'
1139
+ - '995'
1140
+ - '996'
1141
+ - '997'
1142
+ - '998'
1143
+ - '999'
1144
+ - '1000'
1145
+ - '1001'
1146
+ - '1002'
1147
+ - '1003'
1148
+ - '1004'
1149
+ - '1005'
1150
+ - '1006'
1151
+ - '1007'
1152
+ - '1008'
1153
+ - '1009'
1154
+ - '1010'
1155
+ - '1011'
1156
+ - '1012'
1157
+ - '1013'
1158
+ - '1014'
1159
+ - '1015'
1160
+ - '1016'
1161
+ - '1017'
1162
+ - '1018'
1163
+ - '1019'
1164
+ - '1020'
1165
+ - '1021'
1166
+ - '1022'
1167
+ - '1023'
1168
+ init: null
1169
+ collate_fn_conf: {}
1170
+ use_preprocessor: true
1171
+ waveform_input: false
1172
+ encoder: beats
1173
+ encoder_conf:
1174
+ use_weighted_representation: false
1175
+ is_pretraining: true
1176
+ beats_config:
1177
+ layer_wise_gradient_decay_ratio: 1.0
1178
+ encoder_layerdrop: 0.0
1179
+ dropout: 0.1
1180
+ codebook_vocab_size: 1024
1181
+ fbank_mean: 15.2913
1182
+ fbank_std: 5.90532
1183
+ decoder_layers: 3
1184
+ deep_norm: true
1185
+ use_flash_attn: false
1186
+ relative_position_embedding: true
1187
+ num_buckets: 320
1188
+ max_distance: 800
1189
+ gru_rel_pos: true
1190
+ encoder_layers: 24
1191
+ encoder_embed_dim: 1024
1192
+ encoder_ffn_embed_dim: 4096
1193
+ encoder_attention_heads: 16
1194
+ decoder_embed_dim: 1024
1195
+ decoder_attention_heads: 16
1196
+ model: beats
1197
+ model_conf:
1198
+ ignore_id: -2
1199
+ label_smoothing: 0.1
1200
+ waveform_input: false
1201
+ mixup_probability: 0.0
1202
+ required:
1203
+ - output_dir
1204
+ - token_list
1205
+ version: '202412'
1206
+ distributed: true
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/epoch_latest.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a869b833640b9bb9803851e34df4e3efe42992b9c7f2e2cdbc7cea771320d56
3
+ size 1246137546
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/acc.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/acc_mask.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/acc_unmask.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/count_masked.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/count_unmask.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/entropy.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/gpu_max_cached_mem_GB.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/grad_norm.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/iter_time.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/learning_rate.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/loss.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/loss_scale.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_pred.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_pred_msk.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_pred_unmsk.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_tgt.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/n_uniq_tgt_msk.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/step_time.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/vocab_cov_pred.png ADDED
work/nvme/bbjs/sbharadwaj/7Msounds/exp/beats_iter2_large2.tune_lr1.0e-4_warmup40000_bins1600000_totalsteps400000/images/vocab_cov_tgt.png ADDED