pyf98 committed on
Commit
e64025e
1 Parent(s): 8d87401

add model files

Browse files
Files changed (32) hide show
  1. README.md +379 -0
  2. data/nlsyms.txt +3 -0
  3. exp/asr_stats_raw_en_char_sp/train/feats_stats.npz +3 -0
  4. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/RESULTS.md +57 -0
  5. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/config.yaml +270 -0
  6. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/acc.png +0 -0
  7. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/backward_time.png +0 -0
  8. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/cer.png +0 -0
  9. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/cer_ctc.png +0 -0
  10. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/forward_time.png +0 -0
  11. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/gpu_max_cached_mem_GB.png +0 -0
  12. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/iter_time.png +0 -0
  13. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/loss.png +0 -0
  14. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/loss_att.png +0 -0
  15. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/loss_ctc.png +0 -0
  16. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/optim0_lr0.png +0 -0
  17. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/optim_step_time.png +0 -0
  18. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/train_time.png +0 -0
  19. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/wer.png +0 -0
  20. exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/valid.acc.ave_10best.pth +3 -0
  21. exp/lm_train_lm_transformer_en_char/12epoch.pth +3 -0
  22. exp/lm_train_lm_transformer_en_char/config.yaml +189 -0
  23. exp/lm_train_lm_transformer_en_char/images/backward_time.png +0 -0
  24. exp/lm_train_lm_transformer_en_char/images/forward_time.png +0 -0
  25. exp/lm_train_lm_transformer_en_char/images/gpu_max_cached_mem_GB.png +0 -0
  26. exp/lm_train_lm_transformer_en_char/images/iter_time.png +0 -0
  27. exp/lm_train_lm_transformer_en_char/images/loss.png +0 -0
  28. exp/lm_train_lm_transformer_en_char/images/optim0_lr0.png +0 -0
  29. exp/lm_train_lm_transformer_en_char/images/optim_step_time.png +0 -0
  30. exp/lm_train_lm_transformer_en_char/images/train_time.png +0 -0
  31. exp/lm_train_lm_transformer_en_char/perplexity_test/ppl +1 -0
  32. meta.yaml +10 -0
README.md ADDED
@@ -0,0 +1,379 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - espnet
4
+ - audio
5
+ - automatic-speech-recognition
6
+ language: en
7
+ datasets:
8
+ - chime4
9
+ license: cc-by-4.0
10
+ ---
11
+
12
+ ## ESPnet2 ASR model
13
+
14
+ ### `pyf98/chime4_e_branchformer_e10`
15
+
16
+ This model was trained by Yifan Peng using the chime4 recipe in [espnet](https://github.com/espnet/espnet/).
17
+
18
+ References:
19
+ - [E-Branchformer: Branchformer with Enhanced merging for speech recognition (SLT 2022)](https://arxiv.org/abs/2210.00077)
20
+ - [Branchformer: Parallel MLP-Attention Architectures to Capture Local and Global Context for Speech Recognition and Understanding (ICML 2022)](https://proceedings.mlr.press/v162/peng22a.html)
21
+
22
+ ### Demo: How to use in ESPnet2
23
+
24
+ Follow the [ESPnet installation instructions](https://espnet.github.io/espnet/installation.html)
25
+ if you haven't done that already.
26
+
27
+ ```bash
28
+ cd espnet
29
+ git checkout ad91279f0108d54bd22abe29671b376f048822c5
30
+ pip install -e .
31
+ cd egs2/chime4/asr1
32
+ ./run.sh --skip_data_prep false --skip_train true --download_model pyf98/chime4_e_branchformer_e10
33
+ ```
34
+
35
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
36
+ # RESULTS
37
+ ## Environments
38
+ - date: `Wed Dec 28 15:49:24 EST 2022`
39
+ - python version: `3.9.15 (main, Nov 24 2022, 14:31:59) [GCC 11.2.0]`
40
+ - espnet version: `espnet 202211`
41
+ - pytorch version: `pytorch 1.12.1`
42
+ - Git hash: `f9a8009aef6ff9ba192a78c19b619ae4a9f3b9d2`
43
+ - Commit date: `Wed Dec 28 00:30:54 2022 -0500`
44
+
45
+ ## asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp
46
+ ### WER
47
+
48
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
49
+ |---|---|---|---|---|---|---|---|---|
50
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_beamformit_5mics|1640|27119|93.7|5.0|1.2|0.6|6.8|52.5|
51
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_beamformit_5mics|1640|27120|92.4|6.1|1.6|0.7|8.4|58.2|
52
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_beamformit_5mics|1320|21409|90.2|8.0|1.8|1.0|10.8|60.2|
53
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_beamformit_5mics|1320|21416|88.4|9.3|2.4|1.4|13.0|66.1|
54
+
55
+ ### CER
56
+
57
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
58
+ |---|---|---|---|---|---|---|---|---|
59
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_beamformit_5mics|1640|160390|97.4|1.3|1.3|0.7|3.3|52.5|
60
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_beamformit_5mics|1640|160400|96.6|1.8|1.7|0.9|4.3|58.2|
61
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_beamformit_5mics|1320|126796|95.7|2.3|2.0|1.1|5.4|60.2|
62
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_beamformit_5mics|1320|126812|94.4|2.8|2.8|1.5|7.2|66.1|
63
+
64
+ ### TER
65
+
66
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
67
+ |---|---|---|---|---|---|---|---|---|
68
+
69
+ ## ASR config
70
+
71
+ <details><summary>expand</summary>
72
+
73
+ ```
74
+ config: conf/tuning/train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k.yaml
75
+ print_config: false
76
+ log_level: INFO
77
+ dry_run: false
78
+ iterator_type: sequence
79
+ output_dir: exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp
80
+ ngpu: 1
81
+ seed: 2022
82
+ num_workers: 4
83
+ num_att_plot: 3
84
+ dist_backend: nccl
85
+ dist_init_method: env://
86
+ dist_world_size: 2
87
+ dist_rank: 0
88
+ local_rank: 0
89
+ dist_master_addr: localhost
90
+ dist_master_port: 33561
91
+ dist_launcher: null
92
+ multiprocessing_distributed: true
93
+ unused_parameters: false
94
+ sharded_ddp: false
95
+ cudnn_enabled: true
96
+ cudnn_benchmark: false
97
+ cudnn_deterministic: true
98
+ collect_stats: false
99
+ write_collected_feats: false
100
+ max_epoch: 50
101
+ patience: null
102
+ val_scheduler_criterion:
103
+ - valid
104
+ - loss
105
+ early_stopping_criterion:
106
+ - valid
107
+ - loss
108
+ - min
109
+ best_model_criterion:
110
+ - - valid
111
+ - acc
112
+ - max
113
+ keep_nbest_models: 10
114
+ nbest_averaging_interval: 0
115
+ grad_clip: 5.0
116
+ grad_clip_type: 2.0
117
+ grad_noise: false
118
+ accum_grad: 1
119
+ no_forward_run: false
120
+ resume: true
121
+ train_dtype: float32
122
+ use_amp: true
123
+ log_interval: null
124
+ use_matplotlib: true
125
+ use_tensorboard: true
126
+ create_graph_in_tensorboard: false
127
+ use_wandb: false
128
+ wandb_project: null
129
+ wandb_id: null
130
+ wandb_entity: null
131
+ wandb_name: null
132
+ wandb_model_log_interval: -1
133
+ detect_anomaly: false
134
+ pretrain_path: null
135
+ init_param: []
136
+ ignore_init_mismatch: false
137
+ freeze_param: []
138
+ num_iters_per_epoch: null
139
+ batch_size: 20
140
+ valid_batch_size: null
141
+ batch_bins: 15000000
142
+ valid_batch_bins: null
143
+ train_shape_file:
144
+ - exp/asr_stats_raw_en_char_sp/train/speech_shape
145
+ - exp/asr_stats_raw_en_char_sp/train/text_shape.char
146
+ valid_shape_file:
147
+ - exp/asr_stats_raw_en_char_sp/valid/speech_shape
148
+ - exp/asr_stats_raw_en_char_sp/valid/text_shape.char
149
+ batch_type: numel
150
+ valid_batch_type: null
151
+ fold_length:
152
+ - 80000
153
+ - 150
154
+ sort_in_batch: descending
155
+ sort_batch: descending
156
+ multiple_iterator: false
157
+ chunk_length: 500
158
+ chunk_shift_ratio: 0.5
159
+ num_cache_chunks: 1024
160
+ train_data_path_and_name_and_type:
161
+ - - dump/raw/tr05_multi_noisy_si284_sp/wav.scp
162
+ - speech
163
+ - kaldi_ark
164
+ - - dump/raw/tr05_multi_noisy_si284_sp/text
165
+ - text
166
+ - text
167
+ valid_data_path_and_name_and_type:
168
+ - - dump/raw/dt05_multi_isolated_1ch_track/wav.scp
169
+ - speech
170
+ - kaldi_ark
171
+ - - dump/raw/dt05_multi_isolated_1ch_track/text
172
+ - text
173
+ - text
174
+ allow_variable_data_keys: false
175
+ max_cache_size: 0.0
176
+ max_cache_fd: 32
177
+ valid_max_cache_size: null
178
+ optim: adam
179
+ optim_conf:
180
+ lr: 0.001
181
+ weight_decay: 1.0e-06
182
+ scheduler: warmuplr
183
+ scheduler_conf:
184
+ warmup_steps: 25000
185
+ token_list:
186
+ - <blank>
187
+ - <unk>
188
+ - <space>
189
+ - E
190
+ - T
191
+ - A
192
+ - N
193
+ - I
194
+ - O
195
+ - S
196
+ - R
197
+ - H
198
+ - L
199
+ - D
200
+ - C
201
+ - U
202
+ - M
203
+ - P
204
+ - F
205
+ - G
206
+ - Y
207
+ - W
208
+ - B
209
+ - V
210
+ - K
211
+ - .
212
+ - X
213
+ - ''''
214
+ - J
215
+ - Q
216
+ - Z
217
+ - ','
218
+ - '-'
219
+ - '"'
220
+ - <NOISE>
221
+ - '*'
222
+ - ':'
223
+ - (
224
+ - )
225
+ - '?'
226
+ - '&'
227
+ - ;
228
+ - '!'
229
+ - /
230
+ - '{'
231
+ - '}'
232
+ - '1'
233
+ - '2'
234
+ - '0'
235
+ - $
236
+ - '8'
237
+ - '9'
238
+ - '6'
239
+ - '3'
240
+ - '5'
241
+ - '7'
242
+ - '4'
243
+ - '~'
244
+ - '`'
245
+ - _
246
+ - <*IN*>
247
+ - <*MR.*>
248
+ - \
249
+ - ^
250
+ - <sos/eos>
251
+ init: null
252
+ input_size: null
253
+ ctc_conf:
254
+ dropout_rate: 0.0
255
+ ctc_type: builtin
256
+ reduce: true
257
+ ignore_nan_grad: null
258
+ zero_infinity: true
259
+ joint_net_conf: null
260
+ use_preprocessor: true
261
+ token_type: char
262
+ bpemodel: null
263
+ non_linguistic_symbols: data/nlsyms.txt
264
+ cleaner: null
265
+ g2p: null
266
+ speech_volume_normalize: null
267
+ rir_scp: null
268
+ rir_apply_prob: 1.0
269
+ noise_scp: null
270
+ noise_apply_prob: 1.0
271
+ noise_db_range: '13_15'
272
+ short_noise_thres: 0.5
273
+ frontend: default
274
+ frontend_conf:
275
+ n_fft: 512
276
+ win_length: 400
277
+ hop_length: 160
278
+ fs: 16k
279
+ specaug: specaug
280
+ specaug_conf:
281
+ apply_time_warp: true
282
+ time_warp_window: 5
283
+ time_warp_mode: bicubic
284
+ apply_freq_mask: true
285
+ freq_mask_width_range:
286
+ - 0
287
+ - 27
288
+ num_freq_mask: 2
289
+ apply_time_mask: true
290
+ time_mask_width_ratio_range:
291
+ - 0.0
292
+ - 0.05
293
+ num_time_mask: 2
294
+ normalize: global_mvn
295
+ normalize_conf:
296
+ stats_file: exp/asr_stats_raw_en_char_sp/train/feats_stats.npz
297
+ model: espnet
298
+ model_conf:
299
+ ctc_weight: 0.3
300
+ lsm_weight: 0.1
301
+ length_normalized_loss: false
302
+ preencoder: null
303
+ preencoder_conf: {}
304
+ encoder: e_branchformer
305
+ encoder_conf:
306
+ output_size: 256
307
+ attention_heads: 4
308
+ attention_layer_type: rel_selfattn
309
+ pos_enc_layer_type: rel_pos
310
+ rel_pos_type: latest
311
+ cgmlp_linear_units: 1024
312
+ cgmlp_conv_kernel: 31
313
+ use_linear_after_conv: false
314
+ gate_activation: identity
315
+ num_blocks: 10
316
+ dropout_rate: 0.1
317
+ positional_dropout_rate: 0.1
318
+ attention_dropout_rate: 0.1
319
+ input_layer: conv2d
320
+ layer_drop_rate: 0.0
321
+ linear_units: 1024
322
+ positionwise_layer_type: linear
323
+ use_ffn: true
324
+ macaron_ffn: true
325
+ merge_conv_kernel: 31
326
+ postencoder: null
327
+ postencoder_conf: {}
328
+ decoder: transformer
329
+ decoder_conf:
330
+ attention_heads: 4
331
+ linear_units: 2048
332
+ num_blocks: 6
333
+ dropout_rate: 0.1
334
+ positional_dropout_rate: 0.1
335
+ self_attention_dropout_rate: 0.1
336
+ src_attention_dropout_rate: 0.1
337
+ preprocessor: default
338
+ preprocessor_conf: {}
339
+ required:
340
+ - output_dir
341
+ - token_list
342
+ version: '202211'
343
+ distributed: true
344
+ ```
345
+
346
+ </details>
347
+
348
+
349
+
350
+ ### Citing ESPnet
351
+
352
+ ```bibtex
353
+ @inproceedings{watanabe2018espnet,
354
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
355
+ title={{ESPnet}: End-to-End Speech Processing Toolkit},
356
+ year={2018},
357
+ booktitle={Proceedings of Interspeech},
358
+ pages={2207--2211},
359
+ doi={10.21437/Interspeech.2018-1456},
360
+ url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
361
+ }
362
+
363
+
364
+
365
+
366
+ ```
367
+
368
+ or arXiv:
369
+
370
+ ```bibtex
371
+ @misc{watanabe2018espnet,
372
+ title={ESPnet: End-to-End Speech Processing Toolkit},
373
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
374
+ year={2018},
375
+ eprint={1804.00015},
376
+ archivePrefix={arXiv},
377
+ primaryClass={cs.CL}
378
+ }
379
+ ```
data/nlsyms.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ <*IN*>
2
+ <*MR.*>
3
+ <NOISE>
exp/asr_stats_raw_en_char_sp/train/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2aca9a9d9bf95ba2222dd91ed8d62655135d2637bf76704cf984b7d0e90756c
3
+ size 1402
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/RESULTS.md ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Wed Dec 28 15:49:24 EST 2022`
5
+ - python version: `3.9.15 (main, Nov 24 2022, 14:31:59) [GCC 11.2.0]`
6
+ - espnet version: `espnet 202211`
7
+ - pytorch version: `pytorch 1.12.1`
8
+ - Git hash: `f9a8009aef6ff9ba192a78c19b619ae4a9f3b9d2`
9
+ - Commit date: `Wed Dec 28 00:30:54 2022 -0500`
10
+
11
+ ## asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp
12
+ ### WER
13
+
14
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
15
+ |---|---|---|---|---|---|---|---|---|
16
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_beamformit_2mics|1640|27119|89.0|9.1|1.9|0.9|11.9|73.1|
17
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_beamformit_5mics|1640|27119|90.4|7.9|1.6|0.8|10.3|69.5|
18
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_isolated_1ch_track|1640|27119|87.8|10.1|2.1|1.2|13.4|76.6|
19
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_beamformit_2mics|1640|27120|86.8|10.8|2.4|1.1|14.3|77.2|
20
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_beamformit_5mics|1640|27120|88.6|9.3|2.0|0.9|12.2|73.5|
21
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_isolated_1ch_track|1640|27120|85.4|12.1|2.5|1.5|16.0|78.4|
22
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_beamformit_2mics|1320|21409|83.6|13.9|2.5|1.6|18.1|79.6|
23
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_beamformit_5mics|1320|21409|86.1|11.8|2.2|1.3|15.2|76.4|
24
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_isolated_1ch_track|1320|21409|81.5|15.7|2.8|2.0|20.5|83.7|
25
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_beamformit_2mics|1320|21416|81.6|15.1|3.3|1.9|20.3|82.5|
26
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_beamformit_5mics|1320|21416|84.4|13.0|2.6|1.7|17.3|79.8|
27
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_isolated_1ch_track|1320|21416|79.9|17.0|3.2|2.4|22.5|81.4|
28
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_beamformit_5mics|1640|27119|93.7|5.0|1.2|0.6|6.8|52.5|
29
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_beamformit_5mics|1640|27120|92.4|6.1|1.6|0.7|8.4|58.2|
30
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_beamformit_5mics|1320|21409|90.2|8.0|1.8|1.0|10.8|60.2|
31
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_beamformit_5mics|1320|21416|88.4|9.3|2.4|1.4|13.0|66.1|
32
+
33
+ ### CER
34
+
35
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
36
+ |---|---|---|---|---|---|---|---|---|
37
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_beamformit_2mics|1640|160390|95.7|2.3|2.0|1.1|5.3|73.1|
38
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_beamformit_5mics|1640|160390|96.4|1.9|1.7|0.9|4.5|69.5|
39
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_isolated_1ch_track|1640|160390|95.2|2.6|2.2|1.3|6.2|76.6|
40
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_beamformit_2mics|1640|160400|94.4|3.0|2.6|1.4|7.0|77.2|
41
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_beamformit_5mics|1640|160400|95.4|2.4|2.2|1.1|5.7|73.5|
42
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_isolated_1ch_track|1640|160400|93.7|3.6|2.7|1.7|8.0|78.4|
43
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_beamformit_2mics|1320|126796|92.9|4.0|3.1|1.8|8.9|79.6|
44
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_beamformit_5mics|1320|126796|94.3|3.2|2.5|1.5|7.2|76.4|
45
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_isolated_1ch_track|1320|126796|91.8|4.8|3.4|2.2|10.4|83.7|
46
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_beamformit_2mics|1320|126812|91.3|4.7|4.0|2.2|10.9|82.5|
47
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_beamformit_5mics|1320|126812|93.1|3.7|3.3|1.9|8.8|79.8|
48
+ |decode_asr_lm_lm_train_lm_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_isolated_1ch_track|1320|126812|90.5|5.4|4.1|2.8|12.3|81.4|
49
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_real_beamformit_5mics|1640|160390|97.4|1.3|1.3|0.7|3.3|52.5|
50
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/dt05_simu_beamformit_5mics|1640|160400|96.6|1.8|1.7|0.9|4.3|58.2|
51
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_real_beamformit_5mics|1320|126796|95.7|2.3|2.0|1.1|5.4|60.2|
52
+ |decode_asr_lm_lm_train_lm_transformer_en_char_valid.loss.ave_asr_model_valid.acc.ave/et05_simu_beamformit_5mics|1320|126812|94.4|2.8|2.8|1.5|7.2|66.1|
53
+
54
+ ### TER
55
+
56
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
57
+ |---|---|---|---|---|---|---|---|---|
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/config.yaml ADDED
@@ -0,0 +1,270 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp
7
+ ngpu: 1
8
+ seed: 2022
9
+ num_workers: 4
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: 2
14
+ dist_rank: 0
15
+ local_rank: 0
16
+ dist_master_addr: localhost
17
+ dist_master_port: 33561
18
+ dist_launcher: null
19
+ multiprocessing_distributed: true
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 50
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - acc
39
+ - max
40
+ keep_nbest_models: 10
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 5.0
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 1
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: true
50
+ log_interval: null
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ create_graph_in_tensorboard: false
54
+ use_wandb: false
55
+ wandb_project: null
56
+ wandb_id: null
57
+ wandb_entity: null
58
+ wandb_name: null
59
+ wandb_model_log_interval: -1
60
+ detect_anomaly: false
61
+ pretrain_path: null
62
+ init_param: []
63
+ ignore_init_mismatch: false
64
+ freeze_param: []
65
+ num_iters_per_epoch: null
66
+ batch_size: 20
67
+ valid_batch_size: null
68
+ batch_bins: 15000000
69
+ valid_batch_bins: null
70
+ train_shape_file:
71
+ - exp/asr_stats_raw_en_char_sp/train/speech_shape
72
+ - exp/asr_stats_raw_en_char_sp/train/text_shape.char
73
+ valid_shape_file:
74
+ - exp/asr_stats_raw_en_char_sp/valid/speech_shape
75
+ - exp/asr_stats_raw_en_char_sp/valid/text_shape.char
76
+ batch_type: numel
77
+ valid_batch_type: null
78
+ fold_length:
79
+ - 80000
80
+ - 150
81
+ sort_in_batch: descending
82
+ sort_batch: descending
83
+ multiple_iterator: false
84
+ chunk_length: 500
85
+ chunk_shift_ratio: 0.5
86
+ num_cache_chunks: 1024
87
+ train_data_path_and_name_and_type:
88
+ - - dump/raw/tr05_multi_noisy_si284_sp/wav.scp
89
+ - speech
90
+ - kaldi_ark
91
+ - - dump/raw/tr05_multi_noisy_si284_sp/text
92
+ - text
93
+ - text
94
+ valid_data_path_and_name_and_type:
95
+ - - dump/raw/dt05_multi_isolated_1ch_track/wav.scp
96
+ - speech
97
+ - kaldi_ark
98
+ - - dump/raw/dt05_multi_isolated_1ch_track/text
99
+ - text
100
+ - text
101
+ allow_variable_data_keys: false
102
+ max_cache_size: 0.0
103
+ max_cache_fd: 32
104
+ valid_max_cache_size: null
105
+ optim: adam
106
+ optim_conf:
107
+ lr: 0.001
108
+ weight_decay: 1.0e-06
109
+ scheduler: warmuplr
110
+ scheduler_conf:
111
+ warmup_steps: 25000
112
+ token_list:
113
+ - <blank>
114
+ - <unk>
115
+ - <space>
116
+ - E
117
+ - T
118
+ - A
119
+ - N
120
+ - I
121
+ - O
122
+ - S
123
+ - R
124
+ - H
125
+ - L
126
+ - D
127
+ - C
128
+ - U
129
+ - M
130
+ - P
131
+ - F
132
+ - G
133
+ - Y
134
+ - W
135
+ - B
136
+ - V
137
+ - K
138
+ - .
139
+ - X
140
+ - ''''
141
+ - J
142
+ - Q
143
+ - Z
144
+ - ','
145
+ - '-'
146
+ - '"'
147
+ - <NOISE>
148
+ - '*'
149
+ - ':'
150
+ - (
151
+ - )
152
+ - '?'
153
+ - '&'
154
+ - ;
155
+ - '!'
156
+ - /
157
+ - '{'
158
+ - '}'
159
+ - '1'
160
+ - '2'
161
+ - '0'
162
+ - $
163
+ - '8'
164
+ - '9'
165
+ - '6'
166
+ - '3'
167
+ - '5'
168
+ - '7'
169
+ - '4'
170
+ - '~'
171
+ - '`'
172
+ - _
173
+ - <*IN*>
174
+ - <*MR.*>
175
+ - \
176
+ - ^
177
+ - <sos/eos>
178
+ init: null
179
+ input_size: null
180
+ ctc_conf:
181
+ dropout_rate: 0.0
182
+ ctc_type: builtin
183
+ reduce: true
184
+ ignore_nan_grad: null
185
+ zero_infinity: true
186
+ joint_net_conf: null
187
+ use_preprocessor: true
188
+ token_type: char
189
+ bpemodel: null
190
+ non_linguistic_symbols: data/nlsyms.txt
191
+ cleaner: null
192
+ g2p: null
193
+ speech_volume_normalize: null
194
+ rir_scp: null
195
+ rir_apply_prob: 1.0
196
+ noise_scp: null
197
+ noise_apply_prob: 1.0
198
+ noise_db_range: '13_15'
199
+ short_noise_thres: 0.5
200
+ frontend: default
201
+ frontend_conf:
202
+ n_fft: 512
203
+ win_length: 400
204
+ hop_length: 160
205
+ fs: 16k
206
+ specaug: specaug
207
+ specaug_conf:
208
+ apply_time_warp: true
209
+ time_warp_window: 5
210
+ time_warp_mode: bicubic
211
+ apply_freq_mask: true
212
+ freq_mask_width_range:
213
+ - 0
214
+ - 27
215
+ num_freq_mask: 2
216
+ apply_time_mask: true
217
+ time_mask_width_ratio_range:
218
+ - 0.0
219
+ - 0.05
220
+ num_time_mask: 2
221
+ normalize: global_mvn
222
+ normalize_conf:
223
+ stats_file: exp/asr_stats_raw_en_char_sp/train/feats_stats.npz
224
+ model: espnet
225
+ model_conf:
226
+ ctc_weight: 0.3
227
+ lsm_weight: 0.1
228
+ length_normalized_loss: false
229
+ preencoder: null
230
+ preencoder_conf: {}
231
+ encoder: e_branchformer
232
+ encoder_conf:
233
+ output_size: 256
234
+ attention_heads: 4
235
+ attention_layer_type: rel_selfattn
236
+ pos_enc_layer_type: rel_pos
237
+ rel_pos_type: latest
238
+ cgmlp_linear_units: 1024
239
+ cgmlp_conv_kernel: 31
240
+ use_linear_after_conv: false
241
+ gate_activation: identity
242
+ num_blocks: 10
243
+ dropout_rate: 0.1
244
+ positional_dropout_rate: 0.1
245
+ attention_dropout_rate: 0.1
246
+ input_layer: conv2d
247
+ layer_drop_rate: 0.0
248
+ linear_units: 1024
249
+ positionwise_layer_type: linear
250
+ use_ffn: true
251
+ macaron_ffn: true
252
+ merge_conv_kernel: 31
253
+ postencoder: null
254
+ postencoder_conf: {}
255
+ decoder: transformer
256
+ decoder_conf:
257
+ attention_heads: 4
258
+ linear_units: 2048
259
+ num_blocks: 6
260
+ dropout_rate: 0.1
261
+ positional_dropout_rate: 0.1
262
+ self_attention_dropout_rate: 0.1
263
+ src_attention_dropout_rate: 0.1
264
+ preprocessor: default
265
+ preprocessor_conf: {}
266
+ required:
267
+ - output_dir
268
+ - token_list
269
+ version: '202211'
270
+ distributed: true
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/acc.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/backward_time.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/cer.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/cer_ctc.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/forward_time.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/gpu_max_cached_mem_GB.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/iter_time.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/loss.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/loss_att.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/loss_ctc.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/optim0_lr0.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/optim_step_time.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/train_time.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/images/wer.png ADDED
exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/valid.acc.ave_10best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fedcf47686e935e0a9cbc9e9577aa2eff87ce94ae7d126a77bc837e2690f538
3
+ size 123444017
exp/lm_train_lm_transformer_en_char/12epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13dc5af025af5be3560922587402820207a78d258eb78fe1d47553a62b4b5895
3
+ size 202293743
exp/lm_train_lm_transformer_en_char/config.yaml ADDED
@@ -0,0 +1,189 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accum_grad: 4
2
+ allow_variable_data_keys: false
3
+ batch_bins: 150000
4
+ batch_size: 20
5
+ batch_type: numel
6
+ best_model_criterion:
7
+ - - valid
8
+ - loss
9
+ - min
10
+ bpemodel: null
11
+ chunk_length: 500
12
+ chunk_shift_ratio: 0.5
13
+ cleaner: null
14
+ collect_stats: false
15
+ config: conf/train_lm_transformer.yaml
16
+ cudnn_benchmark: false
17
+ cudnn_deterministic: true
18
+ cudnn_enabled: true
19
+ detect_anomaly: false
20
+ dist_backend: nccl
21
+ dist_init_method: env://
22
+ dist_launcher: null
23
+ dist_master_addr: null
24
+ dist_master_port: null
25
+ dist_rank: null
26
+ dist_world_size: null
27
+ distributed: false
28
+ dry_run: false
29
+ early_stopping_criterion:
30
+ - valid
31
+ - loss
32
+ - min
33
+ fold_length:
34
+ - 150
35
+ freeze_param: []
36
+ g2p: null
37
+ grad_clip: 5.0
38
+ grad_clip_type: 2.0
39
+ grad_noise: false
40
+ ignore_init_mismatch: false
41
+ init: null
42
+ init_param: []
43
+ iterator_type: sequence
44
+ keep_nbest_models: 10
45
+ lm: transformer
46
+ lm_conf:
47
+ att_unit: 512
48
+ dropout_rate: 0.1
49
+ embed_unit: 128
50
+ head: 8
51
+ layer: 16
52
+ pos_enc: null
53
+ unit: 2048
54
+ local_rank: 0
55
+ log_interval: null
56
+ log_level: INFO
57
+ max_cache_fd: 32
58
+ max_cache_size: 0.0
59
+ max_epoch: 30
60
+ model_conf:
61
+ ignore_id: 0
62
+ multiple_iterator: false
63
+ multiprocessing_distributed: false
64
+ nbest_averaging_interval: 0
65
+ ngpu: 1
66
+ no_forward_run: false
67
+ non_linguistic_symbols: data/nlsyms.txt
68
+ num_att_plot: 3
69
+ num_cache_chunks: 1024
70
+ num_iters_per_epoch: null
71
+ num_workers: 1
72
+ optim: adam
73
+ optim_conf:
74
+ lr: 0.001
75
+ output_dir: exp_real2/lm_train_lm_transformer_en_char
76
+ patience: null
77
+ pretrain_path: null
78
+ print_config: false
79
+ required:
80
+ - output_dir
81
+ - token_list
82
+ resume: true
83
+ scheduler: warmuplr
84
+ scheduler_conf:
85
+ warmup_steps: 25000
86
+ seed: 0
87
+ sharded_ddp: false
88
+ sort_batch: descending
89
+ sort_in_batch: descending
90
+ token_list:
91
+ - <blank>
92
+ - <unk>
93
+ - <space>
94
+ - E
95
+ - T
96
+ - A
97
+ - N
98
+ - I
99
+ - O
100
+ - S
101
+ - R
102
+ - H
103
+ - L
104
+ - D
105
+ - C
106
+ - U
107
+ - M
108
+ - P
109
+ - F
110
+ - G
111
+ - Y
112
+ - W
113
+ - B
114
+ - V
115
+ - K
116
+ - .
117
+ - X
118
+ - ''''
119
+ - J
120
+ - Q
121
+ - Z
122
+ - ','
123
+ - '-'
124
+ - '"'
125
+ - <NOISE>
126
+ - '*'
127
+ - ':'
128
+ - (
129
+ - )
130
+ - '?'
131
+ - '&'
132
+ - ;
133
+ - '!'
134
+ - /
135
+ - '{'
136
+ - '}'
137
+ - '1'
138
+ - '2'
139
+ - '0'
140
+ - $
141
+ - '8'
142
+ - '9'
143
+ - '6'
144
+ - '3'
145
+ - '5'
146
+ - '7'
147
+ - '4'
148
+ - '~'
149
+ - '`'
150
+ - _
151
+ - <*IN*>
152
+ - <*MR.*>
153
+ - \
154
+ - ^
155
+ - <sos/eos>
156
+ token_type: char
157
+ train_data_path_and_name_and_type:
158
+ - - dump/raw/lm_train.txt
159
+ - text
160
+ - text
161
+ train_dtype: float32
162
+ train_shape_file:
163
+ - exp_real2/lm_stats_en_char/train/text_shape.char
164
+ unused_parameters: false
165
+ use_amp: false
166
+ use_matplotlib: true
167
+ use_preprocessor: true
168
+ use_tensorboard: true
169
+ use_wandb: false
170
+ val_scheduler_criterion:
171
+ - valid
172
+ - loss
173
+ valid_batch_bins: null
174
+ valid_batch_size: null
175
+ valid_batch_type: null
176
+ valid_data_path_and_name_and_type:
177
+ - - dump/raw/dt05_multi_isolated_1ch_track/text
178
+ - text
179
+ - text
180
+ valid_max_cache_size: null
181
+ valid_shape_file:
182
+ - exp_real2/lm_stats_en_char/valid/text_shape.char
183
+ version: 0.10.7a1
184
+ wandb_entity: null
185
+ wandb_id: null
186
+ wandb_model_log_interval: -1
187
+ wandb_name: null
188
+ wandb_project: null
189
+ write_collected_feats: false
exp/lm_train_lm_transformer_en_char/images/backward_time.png ADDED
exp/lm_train_lm_transformer_en_char/images/forward_time.png ADDED
exp/lm_train_lm_transformer_en_char/images/gpu_max_cached_mem_GB.png ADDED
exp/lm_train_lm_transformer_en_char/images/iter_time.png ADDED
exp/lm_train_lm_transformer_en_char/images/loss.png ADDED
exp/lm_train_lm_transformer_en_char/images/optim0_lr0.png ADDED
exp/lm_train_lm_transformer_en_char/images/optim_step_time.png ADDED
exp/lm_train_lm_transformer_en_char/images/train_time.png ADDED
exp/lm_train_lm_transformer_en_char/perplexity_test/ppl ADDED
@@ -0,0 +1 @@
 
 
1
+ 1.8016810278173603
meta.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ espnet: '202211'
2
+ files:
3
+ asr_model_file: exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/valid.acc.ave_10best.pth
4
+ lm_file: exp/lm_train_lm_transformer_en_char/12epoch.pth
5
+ python: "3.9.15 (main, Nov 24 2022, 14:31:59) \n[GCC 11.2.0]"
6
+ timestamp: 1672282149.739949
7
+ torch: 1.12.1
8
+ yaml_files:
9
+ asr_train_config: exp/asr_train_asr_e_branchformer_e10_mlp1024_linear1024_macaron_lr1e-3_warmup25k_raw_en_char_sp/config.yaml
10
+ lm_train_config: exp/lm_train_lm_transformer_en_char/config.yaml