amitkayal committed on
Commit
3c1b90d
1 Parent(s): f3dab40

Training in progress, step 1000

Browse files
Files changed (3) hide show
  1. config.json +16 -3
  2. pytorch_model.bin +1 -1
  3. training_args.bin +1 -1
config.json CHANGED
@@ -14,16 +14,29 @@
14
  "d_model": 384,
15
  "decoder_attention_heads": 6,
16
  "decoder_ffn_dim": 1536,
17
- "decoder_layerdrop": 0.0,
18
  "decoder_layers": 4,
19
  "decoder_start_token_id": 50258,
20
- "dropout": 0.001,
21
  "encoder_attention_heads": 6,
22
  "encoder_ffn_dim": 1536,
23
  "encoder_layerdrop": 0.0,
24
  "encoder_layers": 4,
25
  "eos_token_id": 50257,
26
- "forced_decoder_ids": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
27
  "init_std": 0.02,
28
  "is_encoder_decoder": true,
29
  "max_length": 448,
 
14
  "d_model": 384,
15
  "decoder_attention_heads": 6,
16
  "decoder_ffn_dim": 1536,
17
+ "decoder_layerdrop": 0.001,
18
  "decoder_layers": 4,
19
  "decoder_start_token_id": 50258,
20
+ "dropout": 0.002,
21
  "encoder_attention_heads": 6,
22
  "encoder_ffn_dim": 1536,
23
  "encoder_layerdrop": 0.0,
24
  "encoder_layers": 4,
25
  "eos_token_id": 50257,
26
+ "forced_decoder_ids": [
27
+ [
28
+ 1,
29
+ 50276
30
+ ],
31
+ [
32
+ 2,
33
+ 50359
34
+ ],
35
+ [
36
+ 3,
37
+ 50363
38
+ ]
39
+ ],
40
  "init_std": 0.02,
41
  "is_encoder_decoder": true,
42
  "max_length": 448,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbcef5e2a7194062d61a9347991825202abe18b868b060f2ffbadf39cff4652f
3
  size 151097331
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5a08eabbc6c0d9d110c46d3698dcebf96be426dd9a315ad12899cda43d1cf56
3
  size 151097331
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61ba97ab2c8a29b57887653d24c133456633e9515673a5fd3d099c5df2cd83ab
3
  size 3567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1e67d801aaa88c36784a2cf1f21d7f615ef79cd324b6fec8ebf6503a1fe78bd
3
  size 3567