# Source viewer metadata (at capture time): file size 801 bytes, revision 868e3b5
---

# Integer seed value.
# NOTE(review): presumably used to initialise the random number generators of
# the training run — confirm against the code that loads this config.
seed: 1234

# Data
# Dataset and data-loading settings. The code that consumes these keys is not
# part of this file, so notes marked NOTE(review) are inferred from key names
# only and should be confirmed against that code.
# Empty string in this file.
# NOTE(review): presumably a path that must be filled in before use — confirm.
f0_path: ''
# NOTE(review): looks like the fraction of data used for training — confirm.
p_train: 0.95
# Explicit null (no value set).
min_frames: null
batch_size: 128
# A single comma-separated string, not a YAML list.
features: f0_interp,vuv
# A single comma-separated string, not a YAML list.
out_features: norm_f0_interp,vuv
# Explicit null (no value set).
segment_size: null
segment_multi: 16
num_workers: 4
vuv_scale: 2
# Empty string in this file.
# NOTE(review): presumably a path to per-speaker statistics — confirm.
speaker_stats: ''
# NOTE(review): presumably the name of the reconstruction loss function that
# the training code looks up — confirm.
recon_loss_fn: l1_loss


# Optimization
# Optimizer-related settings.
# NOTE(review): adam_b1 / adam_b2 look like Adam beta coefficients and
# lr_decay like a multiplicative learning-rate decay factor — confirm against
# the training code, which is not visible here.
learning_rate: 0.0002
adam_b1: 0.8
adam_b2: 0.99
lr_decay: 0.999
# NOTE(review): presumably the weight of a commitment loss term — confirm.
lambda_commit: 0.02

# VQ params
# Nested mapping of vector-quantizer settings.
# NOTE(review): presumably passed to the quantizer's constructor — confirm.
vq_params:
  # NOTE(review): looks like the number of codebook entries — confirm.
  l_bins: 64
  # Same value (128) as output_emb_width in encoder_params and decoder_params.
  emb_width: 128
  # NOTE(review): possibly a moving-average decay factor — confirm.
  mu: 0.99
  levels: 1

# Encoder params
# Nested mapping of encoder settings. Every key/value here is identical to the
# corresponding entry in decoder_params.
# NOTE(review): if the two are required to match, keep them in sync — confirm.
encoder_params:
  # Equals the number of comma-separated names in `features` (f0_interp, vuv).
  # NOTE(review): presumably one input channel per feature — confirm.
  input_emb_width: 2
  # Same value (128) as vq_params.emb_width.
  output_emb_width: 128
  levels: 1
  # downs_t and strides_t are one-element lists; their length equals `levels`.
  # NOTE(review): presumably one entry per level — confirm.
  downs_t:
  - 4
  strides_t:
  - 2
  width: 32
  depth: 4
  # Written as a float (1.0), unlike the integer values around it.
  m_conv: 1.0
  dilation_growth_rate: 3

# Decoder params
# Nested mapping of decoder settings. Every key/value here is identical to the
# corresponding entry in encoder_params.
# NOTE(review): if the two are required to match, keep them in sync — confirm.
decoder_params:
  # Equals the number of comma-separated names in `out_features`
  # (norm_f0_interp, vuv).
  # NOTE(review): presumably one channel per output feature — confirm.
  input_emb_width: 2
  # Same value (128) as vq_params.emb_width.
  output_emb_width: 128
  levels: 1
  # downs_t and strides_t are one-element lists; their length equals `levels`.
  # NOTE(review): presumably one entry per level — confirm.
  downs_t:
  - 4
  strides_t:
  - 2
  width: 32
  depth: 4
  # Written as a float (1.0), unlike the integer values around it.
  m_conv: 1.0
  dilation_growth_rate: 3