File size: 1,078 Bytes
# Lightning-based configuration for the Transformer model
# NOTE(review): this header originally said "LSTM" and "extends the base LSTM
# configuration", but MODEL.TYPE is 'Transformer' — confirm which base
# configuration this file actually extends.
# Configuration is grouped into four sections: MODEL, TRAIN, INFERENCE, DATA.
# Keys such as DEVICE, BATCH_SIZE, USE_ASR and MAX_LENGTH appear in more than
# one section, so the nesting below is required — at top level they would be
# duplicate keys and the last occurrence would silently win.
# NOTE(review): section membership was reconstructed from key order — confirm
# against the loader's schema.

# Model settings.
MODEL:
  TYPE: 'Transformer'
  # NOTE(review): MAXLEN is 272 while INFERENCE.MAX_LENGTH and DATA.MAX_LENGTH
  # are 270 — confirm the difference of 2 is intentional.
  MAXLEN: 272
  VOCAB_SIZE: 77
  ASR_VOCAB_SIZE: 91
  D_MODEL: 256
  NUM_HEADS: 4
  DFF: 128
  NUM_BLOCKS: 2
  DROPOUT_RATE: 0.2
  OUTPUT_SIZE: 19
  USE_ASR: false
  PRETRAINED_PATH: null
  LOAD_TEXT_BRANCH_ONLY: false
  WITH_CONN: false

# Training settings.
TRAIN:
  DEVICE: 'cuda'
  BATCH_SIZE: 128
  NUM_EPOCHS: 1000
  LEARNING_RATE: 0.001
  SAVE_FREQ: 30
  EVAL_FREQ: 1
  # NOTE(review): the directory name says "text+asr" but MODEL.USE_ASR and
  # INFERENCE.USE_ASR are both false — confirm the output path is the
  # intended one for this run.
  SAVE_DIR: 'outputs/kssa/transformer-text+asr/tashkeela'
  EARLY_STOPPING_PATIENCE: 50
  ACCUMULATE_GRAD_BATCHES: 1
  VAL_CHECK_INTERVAL: 1.0
  GRAD_CLIP_NORM: 0.5

# Inference settings.
INFERENCE:
  MAX_LENGTH: 270
  WINDOW_SIZE: 50
  BUFFER_SIZE: 25
  DEVICE: 'cpu'
  BATCH_SIZE: 16
  MODEL_PATH: null
  ASR_MODEL_NAME: 'sashat/whisper-medium-ClassicalAr'
  USE_ASR: false
  FORCED_IDS: null
  OUTPUT_PATH: 'results/temp.txt'

# Dataset locations and limits.
DATA:
  TRAIN_PATH: 'data/tashkeela/train.txt'
  VAL_PATH: 'data/tashkeela/val.txt'
  # NOTE(review): train/val come from data/tashkeela but the test split is
  # read from data/clartts — confirm this cross-dataset evaluation is intended.
  TEST_PATH: 'data/clartts/test.txt'
  MAX_LENGTH: 270
  CONSTANTS_PATH: 'constants/'