{ "output_path": "/mnt/netapp2/Store_uni/home/usc/ci/ams/experimentos/gaspar", "logger_uri": null, "run_name": "gaspar_grap_48_104", "project_name": null, "run_description": "\ud83d\udc38Coqui trainer run.", "print_step": 25, "plot_step": 100, "model_param_stats": false, "wandb_entity": null, "dashboard_logger": "tensorboard", "save_on_interrupt": true, "log_model_step": null, "save_step": 10000, "save_n_checkpoints": 10, "save_checkpoints": true, "save_all_best": false, "save_best_after": 400, "target_loss": null, "print_eval": true, "test_delay_epochs": -1, "run_eval": true, "run_eval_steps": null, "distributed_backend": "nccl", "distributed_url": "tcp://localhost:54321", "mixed_precision": true, "precision": "fp16", "epochs": 1300, "batch_size": 48, "eval_batch_size": 16, "grad_clip": [ 1000, 1000 ], "scheduler_after_epoch": true, "lr": 0.0001, "optimizer": "AdamW", "optimizer_params": { "betas": [ 0.8, 0.99 ], "eps": 1e-09, "weight_decay": 0.01 }, "lr_scheduler": null, "lr_scheduler_params": {}, "use_grad_scaler": false, "allow_tf32": false, "cudnn_enable": true, "cudnn_deterministic": false, "cudnn_benchmark": false, "training_seed": 54321, "model": "vits", "num_loader_workers": 8, "num_eval_loader_workers": 4, "use_noise_augment": false, "audio": { "fft_size": 1024, "sample_rate": 16000, "win_length": 1024, "hop_length": 256, "num_mels": 80, "mel_fmin": 0, "mel_fmax": null }, "use_phonemes": false, "phonemizer": null, "phoneme_language": null, "compute_input_seq_cache": true, "text_cleaner": null, "enable_eos_bos_chars": false, "test_sentences_file": "", "phoneme_cache_path": "/mnt/netapp2/Store_uni/home/usc/ci/ams/experimentos/gaspar/phoneme_cache", "characters": { "characters_class": "TTS.tts.models.vits.VitsCharacters", "vocab_dict": null, "pad": "", "eos": "", "bos": "", "blank": "", "characters": "ABCDEFGHIJKLMNOPQRSTUVWXYZ\u00c7\u00c1\u00c9\u00cd\u00cf\u00d3\u00da\u00dcabcdefghijklmnopqrstuvwxyz\u00f1\u00e1\u00e9\u00ed\u00ef\u00f3\u00fa\u00fc", 
"punctuations": "!\u00a1'(),-.:;\u00bf? \"\n", "phonemes": null, "is_unique": true, "is_sorted": true }, "add_blank": true, "batch_group_size": 5, "loss_masking": null, "min_audio_len": 1, "max_audio_len": Infinity, "min_text_len": 1, "max_text_len": Infinity, "compute_f0": false, "compute_energy": false, "compute_linear_spec": true, "precompute_num_workers": 0, "start_by_longest": false, "shuffle": false, "drop_last": false, "datasets": [ { "formatter": "nos_grafemas", "dataset_name": "", "path": "/mnt/netapp2/Store_uni/home/usc/ci/ams/experimentos/gaspar/", "meta_file_train": "texto_corpus_masculino_train.csv", "ignored_speakers": null, "language": "", "phonemizer": "", "meta_file_val": "", "meta_file_attn_mask": "" } ], "test_sentences": [ "como van executar todas estas funci\u00f3ns que lles est\u00e1n a pedir?", "a defensa institucional faina ese goberno e quen goberne, non?", "supo\u00f1o que iso fala dos poucos argumentos que hai enriba da mesa para falar desta cuesti\u00f3n.", "hai xiros da linguaxe con sentido figurado que non deben interpretarse en sentido literal.", "a sentenza completa publicarase nos pr\u00f3ximos d\u00edas.", "as temperaturas descenden lixeiramente, pero seguir\u00e1n elevadas pola tarde.", "era un dos m\u00e1is interesantes proxectos nados na internet galaica.", "falamos xa do tempo: hai avisos no litoral e nalgunhas zonas do interior por vento.", "\u00e9 dif\u00edcil, non?", "a escaseza de vacinas en europa poder\u00eda complicar a administraci\u00f3n da segunda dose.", "que queres!?", "as medidas afectan en galicia a m\u00e1is dun cento de barcos e dous milleiros de mari\u00f1eiros.", "por favor, marque o catrocentos corenta e seis sesenta e oito oitenta e oito oitenta e seis.", "o carballo da retorta ten unha folla revirada que lla revirou o aire unha noite de xeada.", "orden\u00e1molos en par\u00e1grafos de catro li\u00f1as ou de seis?", 
"\u00e9 licenciada en ciencias econ\u00f3micas e desenvolveu a meirande parte da s\u00faa carreira profesional na administraci\u00f3n p\u00fablica.", "os enxe\u00f1eiros cualificaron a obra de moi complexa debido \u00e1 orograf\u00eda das zonas polas que discorre a v\u00eda.", "ti xa sabes o que debes facer.", "ter\u00e1s algo que contar...", "que esc\u00e1ndalo!", "que ben ole!", "donas e cabaleiros: voulles amosa-lo home m\u00e1is forte do mundo.", "a curuxa!, -berrou o vello.", "a erupci\u00f3n provoca a emanaci\u00f3n de gases \u00e1 atmosfera.", "as autoestradas da xunta (vigo baiona e a coru\u00f1a carballo) estar\u00e1n rematadas no ano mil novecentos noventa e sete.", "investigadores estadounidenses identifican o xene responsable da propagaci\u00f3n das c\u00e9lulas cancer\u00edxenas.", "ai!, e xogando \u00f3 trompo tam\u00e9n hab\u00eda xente que o coll\u00eda \u00e1 u\u00f1a, non sabes?, e velo coller \u00e1 u\u00f1a...", "o valor das n\u00e9coras e das centolas de antano.", "os hostaleiros miran as cifras con preocupaci\u00f3n.", "deber\u00e1 efectuar a comunicaci\u00f3n coa debida antecedencia." 
], "eval_split_max_size": null, "eval_split_size": 0.05, "use_speaker_weighted_sampler": false, "speaker_weighted_sampler_alpha": 1.0, "use_language_weighted_sampler": false, "language_weighted_sampler_alpha": 1.0, "use_length_weighted_sampler": false, "length_weighted_sampler_alpha": 1.0, "model_args": { "num_chars": 85, "out_channels": 513, "spec_segment_size": 32, "hidden_channels": 192, "hidden_channels_ffn_text_encoder": 768, "num_heads_text_encoder": 2, "num_layers_text_encoder": 6, "kernel_size_text_encoder": 3, "dropout_p_text_encoder": 0.1, "dropout_p_duration_predictor": 0.5, "kernel_size_posterior_encoder": 5, "dilation_rate_posterior_encoder": 1, "num_layers_posterior_encoder": 16, "kernel_size_flow": 5, "dilation_rate_flow": 1, "num_layers_flow": 4, "resblock_type_decoder": "1", "resblock_kernel_sizes_decoder": [ 3, 7, 11 ], "resblock_dilation_sizes_decoder": [ [ 1, 3, 5 ], [ 1, 3, 5 ], [ 1, 3, 5 ] ], "upsample_rates_decoder": [ 8, 8, 2, 2 ], "upsample_initial_channel_decoder": 512, "upsample_kernel_sizes_decoder": [ 16, 16, 4, 4 ], "periods_multi_period_discriminator": [ 2, 3, 5, 7, 11 ], "use_sdp": true, "noise_scale": 1.0, "inference_noise_scale": 0.667, "length_scale": 1, "noise_scale_dp": 1.0, "inference_noise_scale_dp": 1.0, "max_inference_len": null, "init_discriminator": true, "use_spectral_norm_disriminator": false, "use_speaker_embedding": false, "num_speakers": 0, "speakers_file": null, "d_vector_file": null, "speaker_embedding_channels": 256, "use_d_vector_file": false, "d_vector_dim": 0, "detach_dp_input": true, "use_language_embedding": false, "embedded_language_dim": 4, "num_languages": 0, "language_ids_file": null, "use_speaker_encoder_as_loss": false, "speaker_encoder_config_path": "", "speaker_encoder_model_path": "", "condition_dp_on_speaker": true, "freeze_encoder": false, "freeze_DP": false, "freeze_PE": false, "freeze_flow_decoder": false, "freeze_waveform_decoder": false, "encoder_sample_rate": null, "interpolate_z": true, 
"reinit_DP": false, "reinit_text_encoder": false }, "lr_gen": 0.0002, "lr_disc": 0.0002, "lr_scheduler_gen": "ExponentialLR", "lr_scheduler_gen_params": { "gamma": 0.999875, "last_epoch": -1 }, "lr_scheduler_disc": "ExponentialLR", "lr_scheduler_disc_params": { "gamma": 0.999875, "last_epoch": -1 }, "kl_loss_alpha": 1.0, "disc_loss_alpha": 1.0, "gen_loss_alpha": 1.0, "feat_loss_alpha": 1.0, "mel_loss_alpha": 45.0, "dur_loss_alpha": 1.0, "speaker_encoder_loss_alpha": 1.0, "return_wav": true, "use_weighted_sampler": false, "weighted_sampler_attrs": {}, "weighted_sampler_multipliers": {}, "r": 1, "num_speakers": 0, "use_speaker_embedding": false, "speakers_file": null, "speaker_embedding_channels": 256, "language_ids_file": null, "use_language_embedding": false, "use_d_vector_file": false, "d_vector_file": null, "d_vector_dim": 0, "github_branch": "inside_docker" }