# File size: 801 bytes; file-viewer header referenced 868e3b5 (presumably a commit hash).
# Seed value (presumably for random-number generators; confirm in the consumer).
seed: 1234

# Data
# Empty strings and nulls below are kept exactly as given; how the consumer
# interprets "unset" values is not visible from this file.
f0_path: ''
p_train: 0.95
min_frames: null
batch_size: 128
# Comma-joined names, stored as a single string (not a YAML list).
features: 'f0_interp,vuv'
out_features: 'norm_f0_interp,vuv'
segment_size: null
segment_multi: 16
num_workers: 4
vuv_scale: 2
speaker_stats: ''
recon_loss_fn: 'l1_loss'
# Optimization
# NOTE(review): names suggest an Adam optimizer (b1/b2 presumably its beta
# coefficients) with a multiplicative learning-rate decay; confirm against the
# training code, including how often lr_decay is applied.
learning_rate: 0.0002
adam_b1: 0.8
adam_b2: 0.99
lr_decay: 0.999
# Presumably the weight of a commitment loss term; TODO confirm.
lambda_commit: 0.02
# VQ params
# Child keys are indented so they belong to the `vq_params` mapping rather
# than the document root (where `levels` would be a duplicate key).
# NOTE(review): presumably vector-quantizer settings; confirm key meanings
# against the consuming code.
vq_params:
  l_bins: 64
  emb_width: 128
  mu: 0.99
  levels: 1
# Encoder params
# Child keys are indented so they belong to the `encoder_params` mapping
# rather than the document root (where they would be duplicate keys).
encoder_params:
  input_emb_width: 2
  output_emb_width: 128
  levels: 1
  # Single-element lists; presumably one entry per level (levels: 1) - confirm.
  downs_t:
    - 4
  strides_t:
    - 2
  width: 32
  depth: 4
  m_conv: 1.0
  dilation_growth_rate: 3
# Decoder params
# Child keys are indented so they belong to the `decoder_params` mapping
# rather than the document root (where they would be duplicate keys).
decoder_params:
  input_emb_width: 2
  output_emb_width: 128
  levels: 1
  # Single-element lists; presumably one entry per level (levels: 1) - confirm.
  downs_t:
    - 4
  strides_t:
    - 2
  width: 32
  depth: 4
  m_conv: 1.0
  dilation_growth_rate: 3