# Source: config.yml uploaded by rufaelfekadu with huggingface_hub (commit 7923e2f, verified; 1.44 kB)
# Lightning-based configuration for the Transformer (text + ASR) model
# Extends the base model configuration with Lightning-specific settings
# Model settings. Child keys are nested under MODEL so they do not collide
# with same-named keys of other sections (USE_ASR also appears in INFERENCE).
MODEL:
  TYPE: 'Transformer'
  # NOTE(review): MAXLEN is 272 while the MAX_LENGTH keys elsewhere in this
  # file are 270 -- presumably two extra positions for boundary tokens; confirm.
  MAXLEN: 272
  VOCAB_SIZE: 77
  ASR_VOCAB_SIZE: 91
  D_MODEL: 256
  NUM_HEADS: 4
  # NOTE(review): DFF (128) is smaller than D_MODEL (256); confirm intended.
  DFF: 128
  NUM_BLOCKS: 2
  DROPOUT_RATE: 0.2
  OUTPUT_SIZE: 19
  USE_ASR: true
  # Absolute path on the author's machine; must be adjusted on other hosts.
  PRETRAINED_PATH: '/home/rufael/Projects/forced_alignment/Diac/outputs/old/results/transformer-text+asr/tashkeela+clartts/tensorboard/version_0/checkpoints/best_model.ckpt'
  LOAD_TEXT_BRANCH_ONLY: false
  # Canonical lowercase boolean (was `False`), matching the keys above.
  WITH_CONN: false
# Training settings. Nested under TRAIN so DEVICE and BATCH_SIZE stay distinct
# from the INFERENCE keys of the same name instead of being overridden by them.
TRAIN:
  DEVICE: 'cuda'
  BATCH_SIZE: 128
  # Upper bound on epochs; EARLY_STOPPING_PATIENCE below presumably ends
  # training sooner -- verify against the training script.
  NUM_EPOCHS: 1000
  LEARNING_RATE: 0.001
  SAVE_FREQ: 30
  EVAL_FREQ: 1
  # Relative path; resolved against the working directory of the run.
  SAVE_DIR: 'outputs/kssa/transformer-text+asr/tashkeela+clartts+kssa'
  EARLY_STOPPING_PATIENCE: 50
  ACCUMULATE_GRAD_BATCHES: 1
  # NOTE(review): keep this a float. If forwarded to Lightning's
  # val_check_interval, 1.0 means "once per epoch" whereas the integer 1
  # would mean "every training batch" -- confirm how it is consumed.
  VAL_CHECK_INTERVAL: 1.0
  GRAD_CLIP_NORM: 0.5
# Inference settings. Nested under INFERENCE so DEVICE, BATCH_SIZE, USE_ASR and
# MAX_LENGTH do not clash with the same keys in the other sections.
INFERENCE:
  MAX_LENGTH: 270
  # NOTE(review): BUFFER_SIZE is half of WINDOW_SIZE -- presumably the overlap
  # between consecutive windows; confirm against the inference code.
  WINDOW_SIZE: 50
  BUFFER_SIZE: 25
  DEVICE: 'cpu'
  BATCH_SIZE: 16
  # Absolute path on the author's machine; must be adjusted on other hosts.
  MODEL_PATH: '/home/rufael/Projects/forced_alignment/Diac/outputs/kssa/transformer-text+asr/tashkeela+clartts+kssa/tensorboard/version_18/checkpoints/best_model.ckpt'
  ASR_MODEL_NAME: 'sashat/whisper-medium-ClassicalAr'
  # Canonical lowercase boolean (was `True`).
  USE_ASR: true
  FORCED_IDS: null
  OUTPUT_PATH: 'outputs/kssa/transformer-text+asr/tashkeela+clartts+kssa/outs/dev_nobom.txt'
# Dataset locations (relative paths). Nested under DATA so MAX_LENGTH does not
# duplicate the INFERENCE key of the same name.
DATA:
  TRAIN_PATH: 'data/kssa/train+asr.tsv'
  VAL_PATH: 'data/kssa/dev+asr.tsv'
  # NOTE(review): TEST_PATH points at the same file as VAL_PATH, so test
  # results are measured on the validation split -- confirm this is intended.
  TEST_PATH: 'data/kssa/dev+asr.tsv'
  MAX_LENGTH: 270
  # NOTE(review): nesting was reconstructed from the section headers; confirm
  # CONSTANTS_PATH belongs under DATA rather than at the top level.
  CONSTANTS_PATH: 'constants/'