moiduy04 committed on
Commit
12d8f44
1 Parent(s): f1bd54d

Upload config_final for ease of use.

Browse files
Files changed (1) hide show
  1. config/config_final.yaml +33 -0
config/config_final.yaml ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ experiment_name: 'runs/transformer_huge'
2
+
3
+ dataset:
4
+ src_lang: 'lo'
5
+ src_tokenizer: 'BPE'
6
+ src_max_seq_len: 400
7
+ tgt_lang: 'vi'
8
+ tgt_tokenizer: 'WordLevel'
9
+ tgt_max_seq_len: 350
10
+ train_dataset: 'train_clean.dat'
11
+ validate_dataset: 'dev_clean.dat'
12
+ tokenizer_file: "tokenizer_{0}.json"
13
+ bleu_dataset: 'test2023'
14
+
15
+ model:
16
+ d_model: 512
17
+ num_heads: 8
18
+ d_ff: 2048
19
+ dropout_p: 0.15
20
+ num_encoder_layers: 8
21
+ num_decoder_layers: 4
22
+ model_folder: "weights"
23
+ model_basename: "transformer_"
24
+ preload: 'huge_61'
25
+
26
+ train:
27
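+ lr: 0.001 # 1e-3 (NOTE(review): comment previously read 1e-2, which does not match this value — confirm intended learning rate)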
28
+ batch_size: 32
29
+ num_epochs: 61
30
+ label_smoothing: 0.1
31
+ on_colab: False # are you training on Colab?
32
+ patience: 1
33
+ warm_up_steps: 200