---
# Configuration with three top-level sections: inference, audio, face.

# Inference-time settings.
inference:
  batch_size: 1
  # Frame dimensions (presumably height/width in pixels — confirm
  # against the code that reads this section).
  frame:
    h: 224
    w: 224
  # One checkpoint path per model variant. The paths are relative; what
  # they are resolved against depends on the loader — confirm.
  model:
    wav2lip:
      checkpoint: "checkpoints/lrs3-wav2lip.pth"
    nota_wav2lip:
      checkpoint: "checkpoints/lrs3-nota-wav2lip.pth"

# Audio feature-extraction settings (mel-related keys: num_mels,
# symmetric_mels).
audio:
  num_mels: 80
  rescale: true
  rescaling_max: 0.9

  use_lws: false

  # NOTE(review): if hop_size and win_size are counted in samples, then at
  # sample_rate 16000 they correspond to 12.5 ms and 50 ms — confirm.
  n_fft: 800
  hop_size: 200
  win_size: 800
  sample_rate: 16000

  # Explicitly null (no value set).
  frame_shift_ms: null

  signal_normalization: true
  allow_clipping_in_normalization: true
  symmetric_mels: true
  max_abs_value: 4.0
  preemphasize: true
  preemphasis: 0.97

  # NOTE(review): presumably decibel levels and a frequency band in Hz —
  # confirm units against the consumer.
  min_level_db: -100
  ref_level_db: 20
  fmin: 55
  fmax: 7600

# Face / video settings.
face:
  video_fps: 25
  img_size: 96
  mel_step_size: 16