rufaelfekadu committed on
Commit
af1bff0
·
verified ·
1 Parent(s): 27f6f5a

Upload model checkpoint and constants (http)

Browse files
Files changed (2) hide show
  1. README.md +1 -0
  2. config.yml +51 -0
README.md CHANGED
@@ -4,6 +4,7 @@ tags:
4
  - diacritization
5
  - nlp
6
  - arabic
 
7
  metrics:
8
  - DER
9
  - WER
 
4
  - diacritization
5
  - nlp
6
  - arabic
7
+ - transformer
8
  metrics:
9
  - DER
10
  - WER
config.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Lightning-based configuration for the Transformer model
2
+ # Extends the base model configuration with Lightning-specific settings
3
+
4
+ MODEL:
5
+ TYPE: 'Transformer'
6
+ MAXLEN: 272
7
+ VOCAB_SIZE: 77
8
+ ASR_VOCAB_SIZE: 91
9
+ D_MODEL: 256
10
+ NUM_HEADS: 4
11
+ DFF: 128
12
+ NUM_BLOCKS: 2
13
+ DROPOUT_RATE: 0.2
14
+ OUTPUT_SIZE: 19
15
+ USE_ASR: true
16
+ PRETRAINED_PATH: /home/rufael/Projects/forced_alignment/Diac/outputs/old/results/transformer-text+asr/tashkeela+clartts/tensorboard/version_0/checkpoints/best_model.ckpt
17
+ LOAD_TEXT_BRANCH_ONLY: false
18
+ WITH_CONN: False
19
+
20
+ TRAIN:
21
+ DEVICE: 'cuda'
22
+ BATCH_SIZE: 128
23
+ NUM_EPOCHS: 1000
24
+ LEARNING_RATE: 0.001
25
+ SAVE_FREQ: 30
26
+ EVAL_FREQ: 1
27
+ SAVE_DIR: 'outputs/kssa/transformer-text+asr/tashkeela+clartts+kssa'
28
+ EARLY_STOPPING_PATIENCE: 50
29
+ ACCUMULATE_GRAD_BATCHES: 1
30
+ VAL_CHECK_INTERVAL: 1.0
31
+ GRAD_CLIP_NORM: 0.5
32
+
33
+ INFERENCE:
34
+ MAX_LENGTH: 270
35
+ WINDOW_SIZE: 50
36
+ BUFFER_SIZE: 25
37
+ DEVICE: 'cpu'
38
+ BATCH_SIZE: 16
39
+ MODEL_PATH: /home/rufael/Projects/forced_alignment/Diac/outputs/kssa/transformer-text+asr/tashkeela+clartts+kssa/tensorboard/version_18/checkpoints/best_model.ckpt
40
+ ASR_MODEL_NAME: 'sashat/whisper-medium-ClassicalAr'
41
+ USE_ASR: True
42
+ FORCED_IDS: null
43
+ OUTPUT_PATH: 'outputs/kssa/transformer-text+asr/tashkeela+clartts+kssa/outs/dev_nobom.txt'
44
+
45
+ DATA:
46
+ TRAIN_PATH: 'data/kssa/train+asr.tsv'
47
+ VAL_PATH: 'data/kssa/dev+asr.tsv'
48
+ TEST_PATH: 'data/kssa/dev+asr.tsv'
49
+ MAX_LENGTH: 270
50
+
51
+ CONSTANTS_PATH: 'constants/'