sorayutmild committed on
Commit
dc8fa44
1 Parent(s): 05bd9cd

Training in progress, step 2000

Browse files
Files changed (25) hide show
  1. .gitattributes +1 -0
  2. .gitignore +1 -0
  3. config.json +32 -0
  4. pytorch_model.bin +3 -0
  5. runs/Dec22_13-19-54_3efc8d045e2f/1671715404.0960257/events.out.tfevents.1671715404.3efc8d045e2f.23.2 +3 -0
  6. runs/Dec22_13-19-54_3efc8d045e2f/1671715417.2763708/events.out.tfevents.1671715417.3efc8d045e2f.23.3 +3 -0
  7. runs/Dec22_13-19-54_3efc8d045e2f/1671715428.5540988/events.out.tfevents.1671715428.3efc8d045e2f.23.4 +3 -0
  8. runs/Dec22_13-19-54_3efc8d045e2f/1671715441.1662471/events.out.tfevents.1671715441.3efc8d045e2f.23.5 +3 -0
  9. runs/Dec22_13-19-54_3efc8d045e2f/1671715451.616452/events.out.tfevents.1671715451.3efc8d045e2f.23.6 +3 -0
  10. runs/Dec22_13-19-54_3efc8d045e2f/1671715492.9185338/events.out.tfevents.1671715492.3efc8d045e2f.23.7 +3 -0
  11. runs/Dec22_13-19-54_3efc8d045e2f/events.out.tfevents.1671715403.3efc8d045e2f.23.1 +3 -0
  12. runs/Dec22_13-25-09_3efc8d045e2f/1671715524.4630265/events.out.tfevents.1671715524.3efc8d045e2f.23.9 +3 -0
  13. runs/Dec22_13-25-09_3efc8d045e2f/1671715531.49861/events.out.tfevents.1671715531.3efc8d045e2f.23.10 +3 -0
  14. runs/Dec22_13-25-09_3efc8d045e2f/events.out.tfevents.1671715524.3efc8d045e2f.23.8 +3 -0
  15. runs/Dec22_13-26-27_3efc8d045e2f/1671715591.830819/events.out.tfevents.1671715591.3efc8d045e2f.23.12 +3 -0
  16. runs/Dec22_13-26-27_3efc8d045e2f/1671715666.0171692/events.out.tfevents.1671715666.3efc8d045e2f.23.13 +3 -0
  17. runs/Dec22_13-26-27_3efc8d045e2f/events.out.tfevents.1671715591.3efc8d045e2f.23.11 +3 -0
  18. runs/Dec22_13-27-58_3efc8d045e2f/1671715687.5748084/events.out.tfevents.1671715687.3efc8d045e2f.23.15 +3 -0
  19. runs/Dec22_13-27-58_3efc8d045e2f/1671715692.787198/events.out.tfevents.1671715692.3efc8d045e2f.23.16 +3 -0
  20. runs/Dec22_13-27-58_3efc8d045e2f/events.out.tfevents.1671715687.3efc8d045e2f.23.14 +3 -0
  21. special_tokens_map.json +5 -0
  22. spiece.model +3 -0
  23. tokenizer.json +3 -0
  24. tokenizer_config.json +12 -0
  25. training_args.bin +3 -0
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "thanathorn/mt5-cpe-kmutt-thai-sentence-sum",
3
+ "architectures": [
4
+ "MT5ForConditionalGeneration"
5
+ ],
6
+ "d_ff": 2048,
7
+ "d_kv": 64,
8
+ "d_model": 768,
9
+ "decoder_start_token_id": 0,
10
+ "dense_act_fn": "gelu_new",
11
+ "dropout_rate": 0.1,
12
+ "eos_token_id": 1,
13
+ "feed_forward_proj": "gated-gelu",
14
+ "initializer_factor": 1.0,
15
+ "is_encoder_decoder": true,
16
+ "is_gated_act": true,
17
+ "layer_norm_epsilon": 1e-06,
18
+ "model_type": "mt5",
19
+ "num_decoder_layers": 12,
20
+ "num_heads": 12,
21
+ "num_layers": 12,
22
+ "output_past": true,
23
+ "pad_token_id": 0,
24
+ "relative_attention_max_distance": 128,
25
+ "relative_attention_num_buckets": 32,
26
+ "tie_word_embeddings": false,
27
+ "tokenizer_class": "T5Tokenizer",
28
+ "torch_dtype": "float32",
29
+ "transformers_version": "4.20.1",
30
+ "use_cache": true,
31
+ "vocab_size": 250112
32
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55d69b4085f93b4ff49bdc1d5c842cd55c55463006f2e9d5ad97b36ba717e287
3
+ size 2329700173
runs/Dec22_13-19-54_3efc8d045e2f/1671715404.0960257/events.out.tfevents.1671715404.3efc8d045e2f.23.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7ff07576274d3c7283f58c2fe06b75ec97d3d0d84142c80440a795940c76c20
3
+ size 5702
runs/Dec22_13-19-54_3efc8d045e2f/1671715417.2763708/events.out.tfevents.1671715417.3efc8d045e2f.23.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce1260bda67ecf2418d2c108d0976c12c23e41676b7c1748d58d752c32b42ce6
3
+ size 5702
runs/Dec22_13-19-54_3efc8d045e2f/1671715428.5540988/events.out.tfevents.1671715428.3efc8d045e2f.23.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:607b3e55ccffc0f823f21e02b173815e83b1a8e752db82cae2644922da3d612c
3
+ size 5702
runs/Dec22_13-19-54_3efc8d045e2f/1671715441.1662471/events.out.tfevents.1671715441.3efc8d045e2f.23.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db1a4a0c30ebd52ad67b103302a19c09ab0baa8046331502b7618b11abf9d28d
3
+ size 5702
runs/Dec22_13-19-54_3efc8d045e2f/1671715451.616452/events.out.tfevents.1671715451.3efc8d045e2f.23.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f89180f6461efb659cd4ff130568e2b5d061f86b0b9690a14ea7985b621e53e
3
+ size 5702
runs/Dec22_13-19-54_3efc8d045e2f/1671715492.9185338/events.out.tfevents.1671715492.3efc8d045e2f.23.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:396524122392f355e2b7c1e0766f20bede15c995b21c76948ca3efd1f145f94e
3
+ size 5702
runs/Dec22_13-19-54_3efc8d045e2f/events.out.tfevents.1671715403.3efc8d045e2f.23.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e36c930942299a90c3be9f01c92782eb91bb657972579904f66ddf3a2692b5ed
3
+ size 24584
runs/Dec22_13-25-09_3efc8d045e2f/1671715524.4630265/events.out.tfevents.1671715524.3efc8d045e2f.23.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a08ea118741d707f53fbca8989cb0a7becbcf4ff9b20ed776bc8c8d23f6981ec
3
+ size 5702
runs/Dec22_13-25-09_3efc8d045e2f/1671715531.49861/events.out.tfevents.1671715531.3efc8d045e2f.23.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:215d5387b8396d116a2d5e1d3be7d5e9090ff945221fb7cc0237452a55e02a28
3
+ size 5702
runs/Dec22_13-25-09_3efc8d045e2f/events.out.tfevents.1671715524.3efc8d045e2f.23.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eee41196f6e571128b0ebc97959d8dee01d93dacaeb18e27dfc0f15c778a4ccb
3
+ size 8088
runs/Dec22_13-26-27_3efc8d045e2f/1671715591.830819/events.out.tfevents.1671715591.3efc8d045e2f.23.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:418e00a4f9e7ace6e25b48d7069ffedf2f909664a249fa389508d64dab6be3a9
3
+ size 5702
runs/Dec22_13-26-27_3efc8d045e2f/1671715666.0171692/events.out.tfevents.1671715666.3efc8d045e2f.23.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bce33056c1b4d971024e822dadaa97e31bd9602eb5f40d8f52dea9b2dc544c22
3
+ size 5702
runs/Dec22_13-26-27_3efc8d045e2f/events.out.tfevents.1671715591.3efc8d045e2f.23.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b6daf730b807967a9ad800485b75a176717f346dc2b39e5bfde13417861646f
3
+ size 8088
runs/Dec22_13-27-58_3efc8d045e2f/1671715687.5748084/events.out.tfevents.1671715687.3efc8d045e2f.23.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e324b80818693f86879058985853fb4aae8efbdbfa743d8825ce486893b6e154
3
+ size 5702
runs/Dec22_13-27-58_3efc8d045e2f/1671715692.787198/events.out.tfevents.1671715692.3efc8d045e2f.23.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2419d53a1e0642925605e3e5575ae527b51dfa56bfc3ddc913dc22cf6eeb6310
3
+ size 5702
runs/Dec22_13-27-58_3efc8d045e2f/events.out.tfevents.1671715687.3efc8d045e2f.23.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:072cbdea0cfbf241453e30c882115adf6d456932359ae67f9d39789001ad2187
3
+ size 8716
special_tokens_map.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "eos_token": "</s>",
3
+ "pad_token": "<pad>",
4
+ "unk_token": "<unk>"
5
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
3
+ size 4309802
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93c3578052e1605d8332eb961bc08d72e246071974e4cc54aa6991826b802aa5
3
+ size 16330369
tokenizer_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "eos_token": "</s>",
4
+ "extra_ids": 0,
5
+ "name_or_path": "thanathorn/mt5-cpe-kmutt-thai-sentence-sum",
6
+ "pad_token": "<pad>",
7
+ "sp_model_kwargs": {},
8
+ "special_tokens_map_file": "/home/patrick/.cache/torch/transformers/685ac0ca8568ec593a48b61b0a3c272beee9bc194a3c7241d15dcadb5f875e53.f76030f3ec1b96a8199b2593390c610e76ca8028ef3d24680000619ffb646276",
9
+ "tokenizer_class": "T5Tokenizer",
10
+ "truncate": true,
11
+ "unk_token": "<unk>"
12
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b18463aa97d9f229af1f4234149444ea4ce5edd2060b1732bf8f26a6a382ee2e
3
+ size 3567