# Source: EveryVoice-OpenBible-Chhattisgarhi / config/everyvoice-text-to-spec.yaml
# Commit bb4b839 (verified) by davidguzmanr:
#   "Add config/everyvoice-text-to-spec.yaml for Chhattisgarhi"
# File size: 2.13 kB
# Version string; quoted so it is read as the string '1.0', not the float 1.0.
VERSION: '1.0'
# Contact person for this configuration.
contact:
  contact_email: david.guzman@mail.mcgill.ca
  contact_name: David Guzman
# Model architecture settings for the text-to-spec model.
# Every key below is nested under `model`; without the indentation they would
# be parsed as unrelated top-level keys and `model` itself would be null.
model:
  # Decoder hyperparameters.
  decoder:
    conv_kernel_size: 9
    dropout: 0.2
    feedforward_dim: 1024
    heads: 2
    input_dim: 256
    layers: 4
  # Encoder hyperparameters (same values as the decoder).
  encoder:
    conv_kernel_size: 9
    dropout: 0.2
    feedforward_dim: 1024
    heads: 2
    input_dim: 256
    layers: 4
  learn_alignment: true
  max_length: 1000
  mel_loss: mse
  multilingual: false
  multispeaker: true
  target_text_representation_level: characters
  use_global_style_token_module: false
  use_postnet: true
  # One entry per predicted variance. `energy` and `pitch` carry an extra
  # `level` key; `duration` does not.
  variance_predictors:
    duration:
      depthwise: true
      dropout: 0.5
      input_dim: 256
      kernel_size: 3
      loss: mse
      n_bins: 256
      n_layers: 5
    energy:
      depthwise: true
      dropout: 0.5
      input_dim: 256
      kernel_size: 3
      level: phone
      loss: mse
      n_bins: 256
      n_layers: 5
    pitch:
      depthwise: true
      dropout: 0.5
      input_dim: 256
      kernel_size: 3
      level: phone
      loss: mse
      n_bins: 256
      n_layers: 5
# References to other configuration files (top-level keys).
# The preprocessing and text entries name sibling YAML files; the model and
# training entries are null.
# NOTE(review): presumably a null entry means that section is defined inline in
# this file, and the relative names are resolved against this file's
# directory — confirm against the EveryVoice configuration docs.
path_to_model_config_file: null
path_to_preprocessing_config_file: everyvoice-shared-data.yaml
path_to_text_config_file: everyvoice-shared-text.yaml
path_to_training_config_file: null
# Training settings for the text-to-spec model.
# Every key below is nested under `training`; `optimizer` and `logger` are
# nested mappings of their own. Without the indentation, `training` and
# `optimizer` would be null and their children would become top-level keys.
training:
  attn_bin_loss_warmup_epochs: 100
  attn_bin_loss_weight: 0.1
  attn_ctc_loss_weight: 0.1
  batch_size: 16
  check_val_every_n_epoch: null
  ckpt_epochs: 1
  ckpt_steps: null
  duration_loss_weight: 0.1
  energy_loss_weight: 0.1
  # Dotted path to the loader used for the filelists below.
  filelist_loader: everyvoice.utils.generic_dict_loader
  finetune_checkpoint: null
  logger:
    name: FeaturePredictionExperiment
    save_dir: ../logs_and_checkpoints
    sub_dir_callable: everyvoice.utils.get_current_time
    version: base
  # Both limits are set.
  # NOTE(review): presumably training stops at whichever limit is reached
  # first — confirm against the trainer's documentation.
  max_epochs: 1000
  max_steps: 100000
  mel_loss_weight: 1.0
  optimizer:
    betas: [0.9, 0.999]
    eps: 1.0e-08
    learning_rate: 0.001
    name: noam
    warmup_steps: 1000
    weight_decay: 1.0e-06
  pitch_loss_weight: 0.1
  postnet_loss_weight: 1.0
  save_top_k_ckpts: 5
  train_data_workers: 4
  # NOTE(review): relative paths — presumably resolved against this config
  # file's directory; confirm.
  training_filelist: ../preprocessed/training_filelist.psv
  use_weighted_sampler: false
  val_check_interval: 500
  val_data_workers: 0
  validation_filelist: ../preprocessed/validation_filelist.psv
  vocoder_path: null