benjamin-paine committed on
Commit
7217352
·
verified ·
1 Parent(s): beffce2

Upload speech-enhancement-deep-filter-net-3-config.ini with huggingface_hub

Browse files
speech-enhancement-deep-filter-net-3-config.ini ADDED
@@ -0,0 +1,124 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [train]
2
+ seed = 43
3
+ device =
4
+ model = deepfilternet3
5
+ jit = false
6
+ mask_only = false
7
+ df_only = false
8
+ batch_size = 64
9
+ batch_size_eval = 64
10
+ num_workers = 16
11
+ max_sample_len_s = 3.0
12
+ p_atten_lim = 0.0
13
+ overfit = false
14
+ max_epochs = 120
15
+ log_freq = 100
16
+ log_timings = True
17
+ validation_criteria = loss
18
+ validation_criteria_rule = min
19
+ early_stopping_patience = 25
20
+ global_ds_sampling_f = 1
21
+ num_prefetch_batches = 8
22
+ dataloader_snrs = -100,-5,0,5,10,20,40
23
+ detect_anomaly = false
24
+ batch_size_scheduling = 0/16,2/24,5/32,10/64,20/128,40/9999
25
+ start_eval = false
26
+ validation_set_caching = false
27
+ cp_blacklist =
28
+
29
+ [distortion]
30
+ p_reverb = 0.1
31
+ p_bandwidth_ext = 0.0
32
+ p_clipping = 0.0
33
+ p_air_absorption = 0.0
34
+ p_zeroing = 0.0
35
+ p_interfer_sp = 0.0
36
+
37
+ [df]
38
+ sr = 48000
39
+ fft_size = 960
40
+ hop_size = 480
41
+ nb_erb = 32
42
+ nb_df = 96
43
+ norm_tau = 1
44
+ lsnr_max = 35
45
+ lsnr_min = -15
46
+ min_nb_erb_freqs = 2
47
+ pad_mode = output
48
+ df_order = 5
49
+ df_lookahead = 2
50
+
51
+ [deepfilternet]
52
+ conv_lookahead = 2
53
+ conv_ch = 64
54
+ conv_depthwise = True
55
+ emb_hidden_dim = 256
56
+ emb_num_layers = 3
57
+ enc_linear_groups = 32
58
+ linear_groups = 16
59
+ conv_dec_mode = transposed
60
+ convt_depthwise = False
61
+ mask_pf = False
62
+ df_hidden_dim = 256
63
+ df_num_layers = 2
64
+ dfop_method = df
65
+ group_shuffle = False
66
+ conv_kernel = 1,3
67
+ df_gru_skip = groupedlinear
68
+ df_pathway_kernel_size_t = 5
69
+ enc_concat = False
70
+ conv_kernel_inp = 3,3
71
+ emb_gru_skip = none
72
+ df_n_iter = 1
73
+ convt_kernel = 1,3
74
+ lsnr_dropout = False
75
+
76
+ [localsnrloss]
77
+ factor = 1e-3
78
+
79
+ [maskloss]
80
+ factor = 0
81
+ mask = spec
82
+ gamma = 0.3
83
+ gamma_pred = 0.3
84
+ f_under = 1
85
+
86
+ [spectralloss]
87
+ factor_magnitude = 0
88
+ factor_complex = 0
89
+ gamma = 0.3
90
+ factor_under = 1
91
+
92
+ [dfalphaloss]
93
+ factor = 0.0
94
+
95
+ [multiresspecloss]
96
+ factor = 500
97
+ factor_complex = 500
98
+ gamma = 0.3
99
+ fft_sizes = 256,512,1024,2048
100
+
101
+ [optim]
102
+ lr = 0.001
103
+ momentum = 0
104
+ weight_decay = 1e-12
105
+ weight_decay_end = 0.01
106
+ optimizer = adamw
107
+ lr_min = 1e-06
108
+ lr_warmup = 0.0001
109
+ warmup_epochs = 3
110
+ lr_cycle_mul = 1.0
111
+ lr_cycle_decay = 0.5
112
+ lr_cycle_limit = 1
113
+ lr_update_per_epoch = False
114
+ lr_cycle_epochs = -1
115
+
116
+ [sdrloss]
117
+ factor = 0.0
118
+ segmental_ws = 0
119
+
120
+ [asrloss]
121
+ factor = 0
122
+ factor_lm = 0
123
+ loss_lm = CrossEntropy
124
+ model = base.en