satvik-dixit committed on
Commit
86ba4b6
1 Parent(s): 80ea880

Create config.yaml

Browse files
Files changed (1) hide show
  1. config.yaml +508 -0
config.yaml ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train_asr_demo_branchformer.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: exp/asr_train_asr_demo_branchformer_raw_en_bpe300_sp
9
+ ngpu: 1
10
+ seed: 0
11
+ num_workers: 2
12
+ num_att_plot: 0
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: null
16
+ dist_rank: null
17
+ local_rank: 0
18
+ dist_master_addr: null
19
+ dist_master_port: null
20
+ dist_launcher: null
21
+ multiprocessing_distributed: false
22
+ unused_parameters: false
23
+ sharded_ddp: false
24
+ cudnn_enabled: true
25
+ cudnn_benchmark: false
26
+ cudnn_deterministic: true
27
+ collect_stats: false
28
+ write_collected_feats: false
29
+ max_epoch: 100
30
+ patience: null
31
+ val_scheduler_criterion:
32
+ - valid
33
+ - loss
34
+ early_stopping_criterion:
35
+ - valid
36
+ - loss
37
+ - min
38
+ best_model_criterion:
39
+ - - valid
40
+ - acc
41
+ - max
42
+ keep_nbest_models: 10
43
+ nbest_averaging_interval: 0
44
+ grad_clip: 5.0
45
+ grad_clip_type: 2.0
46
+ grad_noise: false
47
+ accum_grad: 2
48
+ no_forward_run: false
49
+ resume: true
50
+ train_dtype: float32
51
+ use_amp: true
52
+ log_interval: null
53
+ use_matplotlib: true
54
+ use_tensorboard: true
55
+ create_graph_in_tensorboard: false
56
+ use_wandb: false
57
+ wandb_project: null
58
+ wandb_id: null
59
+ wandb_entity: null
60
+ wandb_name: null
61
+ wandb_model_log_interval: -1
62
+ detect_anomaly: false
63
+ use_adapter: false
64
+ adapter: lora
65
+ save_strategy: all
66
+ adapter_conf: {}
67
+ pretrain_path: null
68
+ init_param: []
69
+ ignore_init_mismatch: false
70
+ freeze_param: []
71
+ num_iters_per_epoch: null
72
+ batch_size: 64
73
+ valid_batch_size: null
74
+ batch_bins: 1000000
75
+ valid_batch_bins: null
76
+ train_shape_file:
77
+ - exp/asr_stats_raw_en_bpe300_sp/train/speech_shape
78
+ - exp/asr_stats_raw_en_bpe300_sp/train/text_shape.bpe
79
+ valid_shape_file:
80
+ - exp/asr_stats_raw_en_bpe300_sp/valid/speech_shape
81
+ - exp/asr_stats_raw_en_bpe300_sp/valid/text_shape.bpe
82
+ batch_type: folded
83
+ valid_batch_type: null
84
+ fold_length:
85
+ - 80000
86
+ - 150
87
+ sort_in_batch: descending
88
+ shuffle_within_batch: false
89
+ sort_batch: descending
90
+ multiple_iterator: false
91
+ chunk_length: 500
92
+ chunk_shift_ratio: 0.5
93
+ num_cache_chunks: 1024
94
+ chunk_excluded_key_prefixes: []
95
+ chunk_default_fs: null
96
+ train_data_path_and_name_and_type:
97
+ - - dump/raw/train_nodev_sp/wav.scp
98
+ - speech
99
+ - sound
100
+ - - dump/raw/train_nodev_sp/text
101
+ - text
102
+ - text
103
+ valid_data_path_and_name_and_type:
104
+ - - dump/raw/train_dev/wav.scp
105
+ - speech
106
+ - sound
107
+ - - dump/raw/train_dev/text
108
+ - text
109
+ - text
110
+ allow_variable_data_keys: false
111
+ max_cache_size: 0.0
112
+ max_cache_fd: 32
113
+ allow_multi_rates: false
114
+ valid_max_cache_size: null
115
+ exclude_weight_decay: false
116
+ exclude_weight_decay_conf: {}
117
+ optim: adam
118
+ optim_conf:
119
+ lr: 0.001
120
+ scheduler: warmuplr
121
+ scheduler_conf:
122
+ warmup_steps: 800
123
+ token_list:
124
+ - <blank>
125
+ - <unk>
126
+ - ▁
127
+ - o
128
+ - a
129
+ - ▁e
130
+ - ''''
131
+ - ▁um
132
+ - ▁o
133
+ - e
134
+ - ba
135
+ - ▁mu
136
+ - n
137
+ - la
138
+ - ▁n
139
+ - mu
140
+ - ka
141
+ - ▁ku
142
+ - li
143
+ - ▁oku
144
+ - ▁nga
145
+ - ra
146
+ - ko
147
+ - sa
148
+ - ▁a
149
+ - u
150
+ - ▁ki
151
+ - yo
152
+ - ta
153
+ - ki
154
+ - i
155
+ - tu
156
+ - ku
157
+ - zi
158
+ - t
159
+ - wa
160
+ - ▁tu
161
+ - za
162
+ - ga
163
+ - 'no'
164
+ - si
165
+ - ma
166
+ - ▁nti
167
+ - ▁ne
168
+ - ri
169
+ - ▁ba
170
+ - ▁sebo
171
+ - wo
172
+ - re
173
+ - s
174
+ - r
175
+ - ▁eki
176
+ - ze
177
+ - dde
178
+ - bi
179
+ - na
180
+ - te
181
+ - le
182
+ - se
183
+ - ya
184
+ - nya
185
+ - ge
186
+ - ▁ye
187
+ - bu
188
+ - z
189
+ - ▁ebi
190
+ - jja
191
+ - m
192
+ - ▁ka
193
+ - k
194
+ - ▁na
195
+ - ▁bu
196
+ - ▁omu
197
+ - l
198
+ - g
199
+ - ▁wa
200
+ - b
201
+ - lu
202
+ - ▁obu
203
+ - y
204
+ - ti
205
+ - ▁bi
206
+ - ▁oba
207
+ - p
208
+ - lo
209
+ - gi
210
+ - c
211
+ - ▁aba
212
+ - ro
213
+ - nge
214
+ - ▁nnyo
215
+ - nga
216
+ - ngi
217
+ - j
218
+ - ndi
219
+ - me
220
+ - genda
221
+ - ▁te
222
+ - ▁en
223
+ - fu
224
+ - we
225
+ - ke
226
+ - f
227
+ - gu
228
+ - beera
229
+ - ni
230
+ - d
231
+ - mba
232
+ - yi
233
+ - so
234
+ - sobola
235
+ - nyi
236
+ - kola
237
+ - to
238
+ - wu
239
+ - mi
240
+ - ▁bwe
241
+ - ▁we
242
+ - bo
243
+ - ▁naye
244
+ - nda
245
+ - ▁aka
246
+ - ▁ya
247
+ - ▁kye
248
+ - yina
249
+ - bwa
250
+ - ▁ate
251
+ - ▁era
252
+ - ▁ma
253
+ - ntu
254
+ - ▁s
255
+ - h
256
+ - ▁m
257
+ - be
258
+ - kya
259
+ - ffe
260
+ - yita
261
+ - teeka
262
+ - ▁bw
263
+ - va
264
+ - ▁zi
265
+ - ne
266
+ - gamba
267
+ - go
268
+ - ye
269
+ - vu
270
+ - biri
271
+ - lwa
272
+ - nna
273
+ - ▁p
274
+ - ▁ama
275
+ - yinza
276
+ - ▁ng
277
+ - en
278
+ - ▁ky
279
+ - dd
280
+ - gala
281
+ - twa
282
+ - lira
283
+ - singa
284
+ - su
285
+ - ru
286
+ - oku
287
+ - dda
288
+ - ▁kubanga
289
+ - ana
290
+ - funa
291
+ - mwa
292
+ - nja
293
+ - badde
294
+ - mwaanyi
295
+ - mp
296
+ - ▁to
297
+ - ▁bulungi
298
+ - ▁eddagala
299
+ - ▁by
300
+ - limi
301
+ - ▁w
302
+ - kuba
303
+ - lina
304
+ - ▁gye
305
+ - nye
306
+ - kwa
307
+ - ▁li
308
+ - ▁gu
309
+ - ▁kya
310
+ - nde
311
+ - ▁eby
312
+ - ▁okuba
313
+ - mbe
314
+ - ▁olu
315
+ - ▁sente
316
+ - ▁eri
317
+ - lya
318
+ - ▁buli
319
+ - kozesa
320
+ - ter
321
+ - w
322
+ - ▁y
323
+ - ▁c
324
+ - ▁emi
325
+ - ▁kati
326
+ - gimusa
327
+ - ▁awo
328
+ - mbi
329
+ - ▁so
330
+ - ▁si
331
+ - simba
332
+ - ▁gwe
333
+ - ly
334
+ - ▁d
335
+ - v
336
+ - ▁mwe
337
+ - ngu
338
+ - ▁bwo
339
+ - koola
340
+ - ▁ga
341
+ - ▁ddala
342
+ - ▁be
343
+ - tunu
344
+ - ▁okulaba
345
+ - ngo
346
+ - ▁ekyo
347
+ - ▁mi
348
+ - ▁co
349
+ - manyi
350
+ - sanga
351
+ - mbu
352
+ - ▁okwe
353
+ - ▁gw
354
+ - ▁gy
355
+ - koze
356
+ - gwa
357
+ - ▁kwe
358
+ - ▁bye
359
+ - kwata
360
+ - bwe
361
+ - kulu
362
+ - wuliriza
363
+ - de
364
+ - ▁lye
365
+ - bye
366
+ - ogera
367
+ - ▁bbiri
368
+ - tya
369
+ - ndo
370
+ - ▁no
371
+ - ▁abalimi
372
+ - gambye
373
+ - ve
374
+ - tegeeza
375
+ - ▁olw
376
+ - gya
377
+ - di
378
+ - ▁waliwo
379
+ - ▁eky
380
+ - tandika
381
+ - ▁ddagala
382
+ - buuza
383
+ - emwanyi
384
+ - ▁kaakati
385
+ - mbo
386
+ - tuufu
387
+ - ▁wansi
388
+ - ▁amazzi
389
+ - nyu
390
+ - ch
391
+ - tundu
392
+ - ▁kasooli
393
+ - ▁lw
394
+ - tuuka
395
+ - sooka
396
+ - ▁ssatu
397
+ - tereka
398
+ - ▁ettaka
399
+ - ▁ttaka
400
+ - kiseera
401
+ - ▁byona
402
+ - ▁ensigo
403
+ - ▁nnimiro
404
+ - leeta
405
+ - ▁kw
406
+ - ▁kkumi
407
+ - taano
408
+ - kungula
409
+ - etaaga
410
+ - ▁musanvu
411
+ - ▁okw
412
+ - ▁obulungi
413
+ - ▁then
414
+ - ▁ttaano
415
+ - emmwanyi
416
+ - ▁program
417
+ - ▁obulwadde
418
+ - ▁ogw
419
+ - ▁ndowooza
420
+ - ▁season
421
+ - x
422
+ - q
423
+ - <sos/eos>
424
+ init: xavier_uniform
425
+ input_size: null
426
+ ctc_conf:
427
+ dropout_rate: 0.0
428
+ ctc_type: builtin
429
+ reduce: true
430
+ ignore_nan_grad: null
431
+ zero_infinity: true
432
+ brctc_risk_strategy: exp
433
+ brctc_group_strategy: end
434
+ brctc_risk_factor: 0.0
435
+ joint_net_conf: null
436
+ use_preprocessor: true
437
+ use_lang_prompt: false
438
+ use_nlp_prompt: false
439
+ token_type: bpe
440
+ bpemodel: data/en_token_list/bpe_unigram300/bpe.model
441
+ non_linguistic_symbols: null
442
+ cleaner: null
443
+ g2p: null
444
+ speech_volume_normalize: null
445
+ rir_scp: null
446
+ rir_apply_prob: 1.0
447
+ noise_scp: null
448
+ noise_apply_prob: 1.0
449
+ noise_db_range: '13_15'
450
+ short_noise_thres: 0.5
451
+ aux_ctc_tasks: []
452
+ frontend: default
453
+ frontend_conf:
454
+ fs: 16k
455
+ specaug: specaug
456
+ specaug_conf:
457
+ apply_time_warp: true
458
+ time_warp_window: 5
459
+ time_warp_mode: bicubic
460
+ apply_freq_mask: true
461
+ freq_mask_width_range:
462
+ - 0
463
+ - 30
464
+ num_freq_mask: 2
465
+ apply_time_mask: true
466
+ time_mask_width_range:
467
+ - 0
468
+ - 40
469
+ num_time_mask: 2
470
+ normalize: global_mvn
471
+ normalize_conf:
472
+ stats_file: exp/asr_stats_raw_en_bpe300_sp/train/feats_stats.npz
473
+ model: espnet
474
+ model_conf:
475
+ ctc_weight: 0.3
476
+ lsm_weight: 0.1
477
+ length_normalized_loss: false
478
+ preencoder: null
479
+ preencoder_conf: {}
480
+ encoder: transformer
481
+ encoder_conf:
482
+ output_size: 256
483
+ attention_heads: 4
484
+ linear_units: 1024
485
+ num_blocks: 12
486
+ dropout_rate: 0.1
487
+ positional_dropout_rate: 0.1
488
+ attention_dropout_rate: 0.1
489
+ input_layer: conv2d
490
+ normalize_before: true
491
+ postencoder: null
492
+ postencoder_conf: {}
493
+ decoder: transformer
494
+ decoder_conf:
495
+ attention_heads: 4
496
+ linear_units: 1024
497
+ num_blocks: 6
498
+ dropout_rate: 0.1
499
+ positional_dropout_rate: 0.1
500
+ self_attention_dropout_rate: 0.1
501
+ src_attention_dropout_rate: 0.1
502
+ preprocessor: default
503
+ preprocessor_conf: {}
504
+ required:
505
+ - output_dir
506
+ - token_list
507
+ version: '202402'
508
+ distributed: false