{
  "seed": 1234,
  "epochs": 10000,
  "learning_rate": 0.0002,
  "betas": [
    0.8,
    0.99
  ],
  "eps": 1e-09,
  "batch_size": 32,
  "fp16_run": true,
  "lr_decay": 0.999875,
  "segment_size": 8192,
  "init_lr_ratio": 1.0,
  "warmup_epochs": 0,
  "c_mel": 45,
  "c_kl": 1.0,
  "grad_clip": null,
  "min_seq_length": null,
  "max_seq_length": 400,
  "min_spec_length": null,
  "max_spec_length": null,
  "min_speaker_utterances": null,
  "last_epoch": 1,
  "global_step": 1,
  "best_loss": null,
  "audio": {
    "filter_length": 1024,
    "hop_length": 256,
    "win_length": 1024,
    "mel_channels": 80,
    "sample_rate": 22050,
    "sample_bytes": 2,
    "channels": 1,
    "mel_fmin": 0.0,
    "mel_fmax": null,
    "ref_level_db": 20.0,
    "spec_gain": 1.0,
    "signal_norm": true,
    "min_level_db": -100.0,
    "max_norm": 1.0,
    "clip_norm": true,
    "symmetric_norm": true,
    "do_dynamic_range_compression": true,
    "convert_db_to_amp": true,
    "do_trim_silence": false,
    "trim_silence_db": 40.0,
    "trim_margin_sec": 0.01,
    "trim_keep_sec": 0.25,
    "scale_mels": false
  },
  "model": {
    "num_symbols": 37,
    "n_speakers": 1,
    "inter_channels": 192,
    "hidden_channels": 192,
    "filter_channels": 768,
    "n_heads": 2,
    "n_layers": 6,
    "kernel_size": 3,
    "p_dropout": 0.1,
    "resblock": "2",
    "resblock_kernel_sizes": [
      3,
      5,
      7
    ],
    "resblock_dilation_sizes": [
      [
        1,
        2
      ],
      [
        2,
        6
      ],
      [
        3,
        12
      ]
    ],
    "upsample_rates": [
      8,
      8,
      4
    ],
    "upsample_initial_channel": 256,
    "upsample_kernel_sizes": [
      16,
      16,
      8
    ],
    "n_layers_q": 3,
    "use_spectral_norm": false,
    "gin_channels": 0,
    "use_sdp": true
  },
  "phonemes": {
    "phoneme_separator": "",
    "word_separator": " ",
    "phoneme_to_id": null,
    "pad": "_",
    "bos": "^",
    "eos": "$",
    "blank": "_",
    "blank_word": "#",
    "blank_between": "tokens_and_words",
    "blank_at_start": true,
    "blank_at_end": true,
    "simple_punctuation": true,
    "punctuation_map": null,
    "separate": [
      "\u02c8",
      "\u02cc"
    ],
    "separate_graphemes": false,
    "separate_tones": false,
    "tone_before": false,
    "phoneme_map": null,
    "auto_bos_eos": true,
    "minor_break": ",",
    "major_break": ".",
    "break_phonemes_into_graphemes": false,
    "break_phonemes_into_codepoints": false,
    "drop_stress": false,
    "symbols": null
  },
  "text_aligner": {
    "aligner": null,
    "casing": null
  },
  "text_language": "fa",
  "phonemizer": "espeak",
  "datasets": [
    {
      "name": "persian_tts",
      "metadata_format": "phonemes",
      "multispeaker": false,
      "text_language": null,
      "audio_dir": "/media/12tb/fa/persian-tts-dataset/wav",
      "cache_dir": "/media/cache/persian-tts-dataset"
    }
  ],
  "inference": {
    "length_scale": 1.0,
    "noise_scale": 0.333,
    "noise_w": 0.333,
    "auto_append_text": "."
  },
  "version": 1,
  "git_commit": ""
}