{ "seed": 1234, "epochs": 10000, "learning_rate": 0.0002, "betas": [ 0.8, 0.99 ], "eps": 1e-09, "batch_size": 32, "fp16_run": true, "lr_decay": 0.999875, "segment_size": 8192, "init_lr_ratio": 1.0, "warmup_epochs": 0, "c_mel": 45, "c_kl": 1.0, "grad_clip": null, "min_seq_length": null, "max_seq_length": 400, "min_spec_length": null, "max_spec_length": null, "min_speaker_utterances": null, "last_epoch": 1, "global_step": 1, "best_loss": null, "audio": { "filter_length": 1024, "hop_length": 256, "win_length": 1024, "mel_channels": 80, "sample_rate": 22050, "sample_bytes": 2, "channels": 1, "mel_fmin": 0.0, "mel_fmax": null, "ref_level_db": 20.0, "spec_gain": 1.0, "signal_norm": true, "min_level_db": -100.0, "max_norm": 1.0, "clip_norm": true, "symmetric_norm": true, "do_dynamic_range_compression": true, "convert_db_to_amp": true, "do_trim_silence": false, "trim_silence_db": 40.0, "trim_margin_sec": 0.01, "trim_keep_sec": 0.25, "scale_mels": false }, "model": { "num_symbols": 74, "n_speakers": 6, "inter_channels": 192, "hidden_channels": 192, "filter_channels": 768, "n_heads": 2, "n_layers": 6, "kernel_size": 3, "p_dropout": 0.1, "resblock": "2", "resblock_kernel_sizes": [ 3, 5, 7 ], "resblock_dilation_sizes": [ [ 1, 2 ], [ 2, 6 ], [ 3, 12 ] ], "upsample_rates": [ 8, 8, 4 ], "upsample_initial_channel": 256, "upsample_kernel_sizes": [ 16, 16, 8 ], "n_layers_q": 3, "use_spectral_norm": false, "gin_channels": 512, "use_sdp": true }, "phonemes": { "phoneme_separator": "_", "word_separator": " ", "phoneme_to_id": null, "pad": "_", "bos": "^", "eos": "$", "blank": "_", "blank_word": "#", "blank_between": "tokens_and_words", "blank_at_start": true, "blank_at_end": true, "simple_punctuation": true, "punctuation_map": null, "separate": null, "separate_graphemes": false, "separate_tones": false, "tone_before": false, "phoneme_map": { ":": ",", ";": "," }, "auto_bos_eos": true, "minor_break": ",", "major_break": ".", "break_phonemes_into_graphemes": false, "drop_stress": false, "symbols": [ "!", "'", ",", "-", ".", ":", ";", "?", "\u0410", "\u0411", "\u0412", "\u0413", "\u0490", "\u0414", "\u0415", "\u0404", "\u0416", "\u0417", "\u0418", "\u0406", "\u0407", "\u0419", "\u041a", "\u041b", "\u041c", "\u041d", "\u041e", "\u041f", "\u0420", "\u0421", "\u0422", "\u0423", "\u0424", "\u0425", "\u0426", "\u0427", "\u0428", "\u0429", "\u042c", "\u042e", "\u042f", "\u0430", "\u0431", "\u0432", "\u0433", "\u0491", "\u0434", "\u0435", "\u0454", "\u0436", "\u0437", "\u0438", "\u0456", "\u0457", "\u0439", "\u043a", "\u043b", "\u043c", "\u043d", "\u043e", "\u043f", "\u0440", "\u0441", "\u0442", "\u0443", "\u0444", "\u0445", "\u0446", "\u0447", "\u0448", "\u0449", "\u044c", "\u044e", "\u044f" ] }, "text_aligner": { "aligner": null, "casing": null }, "text_language": "en_US", "phonemizer": "symbols", "datasets": [ { "name": "m-ailabs", "metadata_format": "text", "multispeaker": true, "text_language": null, "audio_dir": "/media/12tb/uk-uk/m-ailabs/uk_UK", "cache_dir": "/media/cache/m-ailabs/uk_UK" } ], "inference": { "length_scale": 1.0, "noise_scale": 0.667, "noise_w": 0.8, "auto_append_text": "." }, "version": 1, "git_commit": "" }