---
# Feature-prediction model configuration.
#
# NOTE(review): this document was previously collapsed onto a single line,
# which is not parseable YAML. The nesting below was reconstructed from the
# flow-mapping boundaries and from the alphabetical key order within each
# mapping; all keys and values are unchanged. Confirm the structure against
# the consumer's schema before relying on it.

# Quoted so the version stays a string instead of becoming the float 1.0.
VERSION: '1.0'

contact:
  contact_email: david.guzman@mail.mcgill.ca
  contact_name: David Guzman

model:
  # decoder and encoder currently carry identical settings.
  decoder:
    conv_kernel_size: 9
    dropout: 0.2
    feedforward_dim: 1024
    heads: 2
    input_dim: 256
    layers: 4
  encoder:
    conv_kernel_size: 9
    dropout: 0.2
    feedforward_dim: 1024
    heads: 2
    input_dim: 256
    layers: 4
  learn_alignment: true
  max_length: 1000
  mel_loss: mse
  multilingual: false
  multispeaker: false
  target_text_representation_level: characters
  use_global_style_token_module: false
  use_postnet: true
  # The three predictors share the same hyperparameters; energy and pitch
  # additionally set `level: phone`, which duration does not have.
  variance_predictors:
    duration:
      depthwise: true
      dropout: 0.5
      input_dim: 256
      kernel_size: 3
      loss: mse
      n_bins: 256
      n_layers: 5
    energy:
      depthwise: true
      dropout: 0.5
      input_dim: 256
      kernel_size: 3
      level: phone
      loss: mse
      n_bins: 256
      n_layers: 5
    pitch:
      depthwise: true
      dropout: 0.5
      input_dim: 256
      kernel_size: 3
      level: phone
      loss: mse
      n_bins: 256
      n_layers: 5

# External configuration files. The model and training entries are null;
# those sections are given inline in this document (`model`, `training`).
# NOTE(review): the relative paths are presumably resolved against this
# file's directory - confirm with the loader.
path_to_model_config_file: null
path_to_preprocessing_config_file: everyvoice-shared-data.yaml
path_to_text_config_file: everyvoice-shared-text.yaml
path_to_training_config_file: null

training:
  attn_bin_loss_warmup_epochs: 100
  attn_bin_loss_weight: 0.1
  attn_ctc_loss_weight: 0.1
  batch_size: 16
  check_val_every_n_epoch: null
  ckpt_epochs: 1
  ckpt_steps: null
  duration_loss_weight: 0.1
  energy_loss_weight: 0.1
  # Dotted path to a callable in the everyvoice.utils module.
  filelist_loader: everyvoice.utils.generic_dict_loader
  finetune_checkpoint: null
  logger:
    name: FeaturePredictionExperiment
    save_dir: ../logs_and_checkpoints
    # Dotted path to a callable in the everyvoice.utils module.
    sub_dir_callable: everyvoice.utils.get_current_time
    version: base
  # NOTE(review): both an epoch limit and a step limit are set; presumably
  # training stops at whichever is reached first - confirm with the trainer.
  max_epochs: 1000
  max_steps: 100000
  mel_loss_weight: 1.0
  optimizer:
    betas: [0.9, 0.999]
    eps: 1.0e-08
    learning_rate: 0.001
    name: noam
    warmup_steps: 1000
    weight_decay: 1.0e-06
  pitch_loss_weight: 0.1
  postnet_loss_weight: 1.0
  save_top_k_ckpts: 5
  train_data_workers: 4
  training_filelist: ../preprocessed/training_filelist.psv
  use_weighted_sampler: false
  val_check_interval: 500
  val_data_workers: 0
  validation_filelist: ../preprocessed/validation_filelist.psv
  vocoder_path: null