ESPnet
English
audio
classification
shikhar7ssu committed on
Commit
94a33b0
·
verified ·
1 Parent(s): 16d46ab

Upload 19 files

Browse files
README.md ADDED
@@ -0,0 +1,291 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - espnet
4
+ - audio
5
+ - classification
6
+ language: en
7
+ datasets:
8
+ - bean
9
+ license: cc-by-4.0
10
+ ---
11
+
12
+ ## ESPnet2 CLS model
13
+
14
+ ### `espnet/BEATs-BEAN.HumBugDB`
15
+
16
+ This model was trained by Shikhar Bharadwaj using the bean recipe in [espnet](https://github.com/espnet/espnet/).
17
+
18
+ ### Demo: How to use in ESPnet2
19
+
20
+ Follow the [ESPnet installation instructions](https://espnet.github.io/espnet/installation.html)
21
+ if you haven't done that already.
22
+
23
+ ```bash
24
+ cd espnet
25
+ git checkout 9191aa59acc7d3ceaca1f48dcc8fbdad2e03484b
26
+ pip install -e .
27
+ cd egs2/bean/cls1
28
+ ./run.sh --skip_data_prep false --skip_train true --download_model espnet/BEATs-BEAN.HumBugDB
29
+ ```
30
+
31
+ <!-- Generated by scripts/utils/show_cls_result.sh -->
32
+ # RESULTS
33
+ ## Environments
34
+ - date: `Tue Jan 7 19:11:31 EST 2025`
35
+ - python version: `3.9.20 (main, Oct 3 2024, 07:27:41) [GCC 11.2.0]`
36
+ - espnet version: `espnet 202412`
37
+ - pytorch version: `pytorch 2.4.0`
38
+ - Git hash: `9191aa59acc7d3ceaca1f48dcc8fbdad2e03484b`
39
+ - Commit date: `Tue Jan 7 04:34:03 2025 -0500`
40
+
41
+ ## cls_humbugdb.20250107.141123
42
+ |Dataset|Metric|Value|
43
+ |---|---|---|
44
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|mean_acc|86.35
45
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|mAP|66.74
46
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|mean_auc|96.32
47
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|n_labels|14.00
48
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|n_instances|1604.00
49
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|mean_acc|80.63
50
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|mAP|67.20
51
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|mean_auc|94.15
52
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|n_labels|14.00
53
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|n_instances|1859.00
54
+
55
+ ## CLS config
56
+
57
+ <details><summary>expand</summary>
58
+
59
+ ```
60
+ config: conf/beats_humbugdb.yaml
61
+ print_config: false
62
+ log_level: INFO
63
+ drop_last_iter: false
64
+ dry_run: false
65
+ iterator_type: sequence
66
+ valid_iterator_type: null
67
+ output_dir: /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123
68
+ ngpu: 1
69
+ seed: 0
70
+ num_workers: 2
71
+ num_att_plot: 0
72
+ dist_backend: nccl
73
+ dist_init_method: env://
74
+ dist_world_size: null
75
+ dist_rank: null
76
+ local_rank: 0
77
+ dist_master_addr: null
78
+ dist_master_port: null
79
+ dist_launcher: null
80
+ multiprocessing_distributed: false
81
+ unused_parameters: true
82
+ sharded_ddp: false
83
+ use_deepspeed: false
84
+ deepspeed_config: null
85
+ cudnn_enabled: true
86
+ cudnn_benchmark: false
87
+ cudnn_deterministic: true
88
+ use_tf32: false
89
+ collect_stats: false
90
+ write_collected_feats: false
91
+ max_epoch: 250
92
+ patience: null
93
+ val_scheduler_criterion:
94
+ - valid
95
+ - loss
96
+ early_stopping_criterion:
97
+ - valid
98
+ - loss
99
+ - min
100
+ best_model_criterion:
101
+ - - valid
102
+ - acc
103
+ - max
104
+ keep_nbest_models: 1
105
+ nbest_averaging_interval: 0
106
+ grad_clip: 1
107
+ grad_clip_type: 2.0
108
+ grad_noise: false
109
+ accum_grad: 1
110
+ no_forward_run: false
111
+ resume: true
112
+ train_dtype: float32
113
+ use_amp: false
114
+ log_interval: null
115
+ use_matplotlib: true
116
+ use_tensorboard: true
117
+ create_graph_in_tensorboard: false
118
+ use_wandb: false
119
+ wandb_project: null
120
+ wandb_id: null
121
+ wandb_entity: null
122
+ wandb_name: null
123
+ wandb_model_log_interval: -1
124
+ detect_anomaly: false
125
+ use_adapter: false
126
+ adapter: lora
127
+ save_strategy: all
128
+ adapter_conf: {}
129
+ pretrain_path: null
130
+ init_param: []
131
+ ignore_init_mismatch: false
132
+ freeze_param: []
133
+ num_iters_per_epoch: null
134
+ batch_size: 32
135
+ valid_batch_size: 32
136
+ batch_bins: 1000000
137
+ valid_batch_bins: null
138
+ category_sample_size: 10
139
+ train_shape_file:
140
+ - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_stats_16k/train/speech_shape
141
+ - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_stats_16k/train/label_shape
142
+ valid_shape_file:
143
+ - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_stats_16k/valid/speech_shape
144
+ - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_stats_16k/valid/label_shape
145
+ batch_type: folded
146
+ valid_batch_type: null
147
+ fold_length:
148
+ - 160000
149
+ - 5
150
+ sort_in_batch: descending
151
+ shuffle_within_batch: false
152
+ sort_batch: descending
153
+ multiple_iterator: false
154
+ chunk_length: 500
155
+ chunk_shift_ratio: 0.5
156
+ num_cache_chunks: 1024
157
+ chunk_excluded_key_prefixes: []
158
+ chunk_default_fs: null
159
+ chunk_max_abs_length: null
160
+ chunk_discard_short_samples: true
161
+ train_data_path_and_name_and_type:
162
+ - - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/dump/humbugdb.train/wav.scp
163
+ - speech
164
+ - sound
165
+ - - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/dump/humbugdb.train/text
166
+ - label
167
+ - text
168
+ valid_data_path_and_name_and_type:
169
+ - - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/dump/humbugdb.dev/wav.scp
170
+ - speech
171
+ - sound
172
+ - - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/dump/humbugdb.dev/text
173
+ - label
174
+ - text
175
+ multi_task_dataset: false
176
+ allow_variable_data_keys: false
177
+ max_cache_size: 0.0
178
+ max_cache_fd: 32
179
+ allow_multi_rates: false
180
+ valid_max_cache_size: null
181
+ exclude_weight_decay: false
182
+ exclude_weight_decay_conf: {}
183
+ optim: adamw
184
+ optim_conf:
185
+ lr: 3.0e-05
186
+ weight_decay: 0.01
187
+ betas:
188
+ - 0.9
189
+ - 0.98
190
+ scheduler: cosineannealingwarmuprestarts
191
+ scheduler_conf:
192
+ first_cycle_steps: 95000
193
+ warmup_steps: 8000
194
+ max_lr: 3.0e-05
195
+ min_lr: 5.0e-06
196
+ token_list:
197
+ - non-mosquito
198
+ - an_arabiensis
199
+ - an_gambiae_ss
200
+ - others
201
+ - culex_quinquefasciatus
202
+ - culex_pipiens_complex
203
+ - an_funestus_ss
204
+ - an_squamosus
205
+ - ma_uniformis
206
+ - an_dirus
207
+ - an_harrisoni
208
+ - an_maculatus
209
+ - ae_aegypti
210
+ - an_funestus_sl
211
+ - <unk>
212
+ token_type: word
213
+ init: xavier_normal
214
+ input_size: 1
215
+ use_preprocessor: true
216
+ frontend: null
217
+ frontend_conf: {}
218
+ specaug: null
219
+ specaug_conf: {}
220
+ normalize: null
221
+ normalize_conf: {}
222
+ preencoder: null
223
+ preencoder_conf: {}
224
+ encoder: beats
225
+ encoder_conf:
226
+ beats_ckpt_path: /compute/babel-13-33/sbharad2/models/BEATs/BEATs_iter3.pt
227
+ beats_config:
228
+ layer_wise_gradient_decay_ratio: 0.3
229
+ encoder_layerdrop: 0.1
230
+ dropout: 0.0
231
+ use_weighted_representation: false
232
+ specaug_config:
233
+ apply_time_warp: true
234
+ apply_freq_mask: false
235
+ apply_time_mask: true
236
+ time_mask_width_ratio_range:
237
+ - 0
238
+ - 0.06
239
+ num_time_mask: 1
240
+ roll_augment: true
241
+ roll_interval: 1
242
+ decoder: linear
243
+ decoder_conf: {}
244
+ model: espnet
245
+ model_conf:
246
+ classification_type: multi-class
247
+ mixup_augmentation: false
248
+ lsm_weight: 0.1
249
+ required:
250
+ - output_dir
251
+ - token_list
252
+ version: '202412'
253
+ distributed: false
254
+ ```
255
+
256
+ </details>
257
+
258
+
259
+
260
+ ### Citing ESPnet
261
+
262
+ ```bibtex
263
+ @inproceedings{watanabe2018espnet,
264
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
265
+ title={{ESPnet}: End-to-End Speech Processing Toolkit},
266
+ year={2018},
267
+ booktitle={Proceedings of Interspeech},
268
+ pages={2207--2211},
269
+ doi={10.21437/Interspeech.2018-1456},
270
+ url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
271
+ }
272
+
273
+
274
+
275
+
276
+
277
+
278
+ ```
279
+
280
+ or arXiv:
281
+
282
+ ```bibtex
283
+ @misc{watanabe2018espnet,
284
+ title={ESPnet: End-to-End Speech Processing Toolkit},
285
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
286
+ year={2018},
287
+ eprint={1804.00015},
288
+ archivePrefix={arXiv},
289
+ primaryClass={cs.CL}
290
+ }
291
+ ```
bean.humbugdb/data/token_list ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ non-mosquito
2
+ an_arabiensis
3
+ an_gambiae_ss
4
+ others
5
+ culex_quinquefasciatus
6
+ culex_pipiens_complex
7
+ an_funestus_ss
8
+ an_squamosus
9
+ ma_uniformis
10
+ an_dirus
11
+ an_harrisoni
12
+ an_maculatus
13
+ ae_aegypti
14
+ an_funestus_sl
15
+ <unk>
bean.humbugdb/exp/cls_humbugdb.20250107.141123/219epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ca9274cadc60e9075f713924143ccb6ab95dc7605ae580d1148515fb9d2bbd
3
+ size 361385029
bean.humbugdb/exp/cls_humbugdb.20250107.141123/RESULTS.md ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_cls_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Tue Jan 7 19:11:31 EST 2025`
5
+ - python version: `3.9.20 (main, Oct 3 2024, 07:27:41) [GCC 11.2.0]`
6
+ - espnet version: `espnet 202412`
7
+ - pytorch version: `pytorch 2.4.0`
8
+ - Git hash: `9191aa59acc7d3ceaca1f48dcc8fbdad2e03484b`
9
+ - Commit date: `Tue Jan 7 04:34:03 2025 -0500`
10
+
11
+ ## cls_humbugdb.20250107.141123
12
+ |Dataset|Metric|Value|
13
+ |---|---|---|
14
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|mean_acc|86.35
15
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|mAP|66.74
16
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|mean_auc|96.32
17
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|n_labels|14.00
18
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.dev/score|n_instances|1604.00
19
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|mean_acc|80.63
20
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|mAP|67.20
21
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|mean_auc|94.15
22
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|n_labels|14.00
23
+ /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/cls_humbugdb.test/score|n_instances|1859.00
24
+
bean.humbugdb/exp/cls_humbugdb.20250107.141123/config.yaml ADDED
@@ -0,0 +1,194 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/beats_humbugdb.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123
9
+ ngpu: 1
10
+ seed: 0
11
+ num_workers: 2
12
+ num_att_plot: 0
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: null
16
+ dist_rank: null
17
+ local_rank: 0
18
+ dist_master_addr: null
19
+ dist_master_port: null
20
+ dist_launcher: null
21
+ multiprocessing_distributed: false
22
+ unused_parameters: true
23
+ sharded_ddp: false
24
+ use_deepspeed: false
25
+ deepspeed_config: null
26
+ cudnn_enabled: true
27
+ cudnn_benchmark: false
28
+ cudnn_deterministic: true
29
+ use_tf32: false
30
+ collect_stats: false
31
+ write_collected_feats: false
32
+ max_epoch: 250
33
+ patience: null
34
+ val_scheduler_criterion:
35
+ - valid
36
+ - loss
37
+ early_stopping_criterion:
38
+ - valid
39
+ - loss
40
+ - min
41
+ best_model_criterion:
42
+ - - valid
43
+ - acc
44
+ - max
45
+ keep_nbest_models: 1
46
+ nbest_averaging_interval: 0
47
+ grad_clip: 1
48
+ grad_clip_type: 2.0
49
+ grad_noise: false
50
+ accum_grad: 1
51
+ no_forward_run: false
52
+ resume: true
53
+ train_dtype: float32
54
+ use_amp: false
55
+ log_interval: null
56
+ use_matplotlib: true
57
+ use_tensorboard: true
58
+ create_graph_in_tensorboard: false
59
+ use_wandb: false
60
+ wandb_project: null
61
+ wandb_id: null
62
+ wandb_entity: null
63
+ wandb_name: null
64
+ wandb_model_log_interval: -1
65
+ detect_anomaly: false
66
+ use_adapter: false
67
+ adapter: lora
68
+ save_strategy: all
69
+ adapter_conf: {}
70
+ pretrain_path: null
71
+ init_param: []
72
+ ignore_init_mismatch: false
73
+ freeze_param: []
74
+ num_iters_per_epoch: null
75
+ batch_size: 32
76
+ valid_batch_size: 32
77
+ batch_bins: 1000000
78
+ valid_batch_bins: null
79
+ category_sample_size: 10
80
+ train_shape_file:
81
+ - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_stats_16k/train/speech_shape
82
+ - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_stats_16k/train/label_shape
83
+ valid_shape_file:
84
+ - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_stats_16k/valid/speech_shape
85
+ - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_stats_16k/valid/label_shape
86
+ batch_type: folded
87
+ valid_batch_type: null
88
+ fold_length:
89
+ - 160000
90
+ - 5
91
+ sort_in_batch: descending
92
+ shuffle_within_batch: false
93
+ sort_batch: descending
94
+ multiple_iterator: false
95
+ chunk_length: 500
96
+ chunk_shift_ratio: 0.5
97
+ num_cache_chunks: 1024
98
+ chunk_excluded_key_prefixes: []
99
+ chunk_default_fs: null
100
+ chunk_max_abs_length: null
101
+ chunk_discard_short_samples: true
102
+ train_data_path_and_name_and_type:
103
+ - - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/dump/humbugdb.train/wav.scp
104
+ - speech
105
+ - sound
106
+ - - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/dump/humbugdb.train/text
107
+ - label
108
+ - text
109
+ valid_data_path_and_name_and_type:
110
+ - - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/dump/humbugdb.dev/wav.scp
111
+ - speech
112
+ - sound
113
+ - - /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/dump/humbugdb.dev/text
114
+ - label
115
+ - text
116
+ multi_task_dataset: false
117
+ allow_variable_data_keys: false
118
+ max_cache_size: 0.0
119
+ max_cache_fd: 32
120
+ allow_multi_rates: false
121
+ valid_max_cache_size: null
122
+ exclude_weight_decay: false
123
+ exclude_weight_decay_conf: {}
124
+ optim: adamw
125
+ optim_conf:
126
+ lr: 3.0e-05
127
+ weight_decay: 0.01
128
+ betas:
129
+ - 0.9
130
+ - 0.98
131
+ scheduler: cosineannealingwarmuprestarts
132
+ scheduler_conf:
133
+ first_cycle_steps: 95000
134
+ warmup_steps: 8000
135
+ max_lr: 3.0e-05
136
+ min_lr: 5.0e-06
137
+ token_list:
138
+ - non-mosquito
139
+ - an_arabiensis
140
+ - an_gambiae_ss
141
+ - others
142
+ - culex_quinquefasciatus
143
+ - culex_pipiens_complex
144
+ - an_funestus_ss
145
+ - an_squamosus
146
+ - ma_uniformis
147
+ - an_dirus
148
+ - an_harrisoni
149
+ - an_maculatus
150
+ - ae_aegypti
151
+ - an_funestus_sl
152
+ - <unk>
153
+ token_type: word
154
+ init: xavier_normal
155
+ input_size: 1
156
+ use_preprocessor: true
157
+ frontend: null
158
+ frontend_conf: {}
159
+ specaug: null
160
+ specaug_conf: {}
161
+ normalize: null
162
+ normalize_conf: {}
163
+ preencoder: null
164
+ preencoder_conf: {}
165
+ encoder: beats
166
+ encoder_conf:
167
+ beats_ckpt_path: /compute/babel-13-33/sbharad2/models/BEATs/BEATs_iter3.pt
168
+ beats_config:
169
+ layer_wise_gradient_decay_ratio: 0.3
170
+ encoder_layerdrop: 0.1
171
+ dropout: 0.0
172
+ use_weighted_representation: false
173
+ specaug_config:
174
+ apply_time_warp: true
175
+ apply_freq_mask: false
176
+ apply_time_mask: true
177
+ time_mask_width_ratio_range:
178
+ - 0
179
+ - 0.06
180
+ num_time_mask: 1
181
+ roll_augment: true
182
+ roll_interval: 1
183
+ decoder: linear
184
+ decoder_conf: {}
185
+ model: espnet
186
+ model_conf:
187
+ classification_type: multi-class
188
+ mixup_augmentation: false
189
+ lsm_weight: 0.1
190
+ required:
191
+ - output_dir
192
+ - token_list
193
+ version: '202412'
194
+ distributed: false
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/acc.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/backward_time.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/clip.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/forward_time.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/gpu_max_cached_mem_GB.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/grad_norm.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/iter_time.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/loss.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/loss_scale.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/macro_precision.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/optim0_lr0.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/optim_step_time.png ADDED
bean.humbugdb/exp/cls_humbugdb.20250107.141123/images/train_time.png ADDED
meta.yaml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ espnet: '202412'
2
+ files:
3
+ classification_model_file: /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/219epoch.pth
4
+ python: "3.9.20 (main, Oct 3 2024, 07:27:41) \n[GCC 11.2.0]"
5
+ timestamp: 1736336817.841514
6
+ torch: 2.4.0
7
+ yaml_files:
8
+ classification_train_config: /compute/babel-11-13/sbharad2/beats_run/bean.humbugdb/exp/cls_humbugdb.20250107.141123/config.yaml