moiduy04 committed on
Commit
62c6f66
1 Parent(s): af2a0dc

Upload 2 files

Browse files
Files changed (2) hide show
  1. config_big.yaml +30 -0
  2. transformer_big.pt +3 -0
config_big.yaml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ experiment_name: "runs/transformer_big"
2
+
3
+ dataset:
4
+ src_lang: 'lo'
5
+ src_tokenizer: 'BPE'
6
+ src_max_seq_len: 400
7
+ tgt_lang: 'vi'
8
+ tgt_tokenizer: 'WordLevel'
9
+ tgt_max_seq_len: 350
10
+ train_dataset: 'train_clean.dat'
11
+ validate_dataset: 'dev_clean.dat'
12
+ tokenizer_file: "tokenizer_{0}.json"
13
+
14
+ model: # 42688527 parameters
15
+ d_model: 512
16
+ num_heads: 8
17
+ d_ff: 2048
18
+ dropout_p: 0.3
19
+ num_encoder_layers: 4
20
+ num_decoder_layers: 2
21
+ model_folder: "weights"
22
+ model_basename: "transformer_big_"
23
+ preload:
24
+
25
+ train:
26
+ lr: 0.001 # 1e-3
27
+ batch_size: 16
28
+ num_epochs: 40
29
+ label_smoothing: 0.1
30
+ on_colab: True # are you training on Colab?
transformer_big.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09d82bd3a97ddc94c74c9ef688478b3fe5f61708445c4f7f304170a243571cb5
3
+ size 501299424