minwooeom committed on
Commit
e11d56b
1 Parent(s): 6e7bb1c
config.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
- "_name_or_path": "t5-small",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
6
- "d_ff": 2048,
7
  "d_kv": 64,
8
- "d_model": 512,
9
  "decoder_start_token_id": 0,
10
  "dense_act_fn": "relu",
11
  "dropout_rate": 0.1,
@@ -17,9 +17,9 @@
17
  "layer_norm_epsilon": 1e-06,
18
  "model_type": "t5",
19
  "n_positions": 512,
20
- "num_decoder_layers": 6,
21
- "num_heads": 8,
22
- "num_layers": 6,
23
  "output_past": true,
24
  "pad_token_id": 0,
25
  "relative_attention_max_distance": 128,
 
1
  {
2
+ "_name_or_path": "t5-base",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
6
+ "d_ff": 3072,
7
  "d_kv": 64,
8
+ "d_model": 768,
9
  "decoder_start_token_id": 0,
10
  "dense_act_fn": "relu",
11
  "dropout_rate": 0.1,
 
17
  "layer_norm_epsilon": 1e-06,
18
  "model_type": "t5",
19
  "n_positions": 512,
20
+ "num_decoder_layers": 12,
21
+ "num_heads": 12,
22
+ "num_layers": 12,
23
  "output_past": true,
24
  "pad_token_id": 0,
25
  "relative_attention_max_distance": 128,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4519a0a301b271a4aff30155c6bc958072df977587a29852161b73351a7ee3f
3
- size 242016345
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:145414a7e4c60cad9ada1bc978c9dc3d109acea373cd4253f0c5d1e9b2165423
3
+ size 891619985
runs/Feb23_22-59-46_a362d227330c/1677193199.5576441/events.out.tfevents.1677193199.a362d227330c.2861.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eed55ce2f5ebb566c82bc5930c19c625c7b0bc7af1e308ffb7bbd5d3100386a
3
+ size 5700
runs/Feb23_22-59-46_a362d227330c/events.out.tfevents.1677193199.a362d227330c.2861.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63b3ddd5ebf6662f01fbbf83b1feefa4918cf3576e1f25b0ceec5197dcaac34c
3
+ size 4654
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:152d5cdf5bcb65ce45f0917d5bd67526a42c75da10045dff9fbc02c67c8ca799
3
  size 3451
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0ea9e5431ae4f4bf35c27f0ee702ac53202bb7069d92234ccc288f3ba688fd8
3
  size 3451