End of training
Browse files
- .gitattributes +1 -0
- .gitignore +1 -0
- config.json +32 -0
- generation_config.json +6 -0
- pytorch_model.bin +3 -0
- runs/Mar18_06-44-24_9890d0642dfc/1679121899.2792878/events.out.tfevents.1679121899.9890d0642dfc.2360.5 +3 -0
- runs/Mar18_06-44-24_9890d0642dfc/events.out.tfevents.1679121899.9890d0642dfc.2360.4 +3 -0
- runs/Mar18_06-46-54_9890d0642dfc/1679122034.1118152/events.out.tfevents.1679122034.9890d0642dfc.2360.7 +3 -0
- runs/Mar18_06-46-54_9890d0642dfc/1679122058.75141/events.out.tfevents.1679122058.9890d0642dfc.2360.8 +3 -0
- runs/Mar18_06-46-54_9890d0642dfc/events.out.tfevents.1679122034.9890d0642dfc.2360.6 +3 -0
- runs/Mar18_06-49-01_9890d0642dfc/1679122158.6341114/events.out.tfevents.1679122158.9890d0642dfc.2360.10 +3 -0
- runs/Mar18_06-49-01_9890d0642dfc/events.out.tfevents.1679122158.9890d0642dfc.2360.9 +3 -0
- runs/Mar18_06-49-44_9890d0642dfc/1679122201.4648492/events.out.tfevents.1679122201.9890d0642dfc.2360.12 +3 -0
- runs/Mar18_06-49-44_9890d0642dfc/1679122214.9618635/events.out.tfevents.1679122214.9890d0642dfc.2360.13 +3 -0
- runs/Mar18_06-49-44_9890d0642dfc/events.out.tfevents.1679122201.9890d0642dfc.2360.11 +3 -0
- runs/Mar18_06-50-48_9890d0642dfc/1679122281.7235017/events.out.tfevents.1679122281.9890d0642dfc.2360.15 +3 -0
- runs/Mar18_06-50-48_9890d0642dfc/1679122293.9574654/events.out.tfevents.1679122293.9890d0642dfc.2360.16 +3 -0
- runs/Mar18_06-50-48_9890d0642dfc/events.out.tfevents.1679122281.9890d0642dfc.2360.14 +3 -0
- runs/Mar18_06-52-23_9890d0642dfc/1679122377.6678984/events.out.tfevents.1679122377.9890d0642dfc.2360.18 +3 -0
- runs/Mar18_06-52-23_9890d0642dfc/1679122391.7081497/events.out.tfevents.1679122391.9890d0642dfc.2360.19 +3 -0
- runs/Mar18_06-52-23_9890d0642dfc/1679122563.8788617/events.out.tfevents.1679122563.9890d0642dfc.2360.20 +3 -0
- runs/Mar18_06-52-23_9890d0642dfc/events.out.tfevents.1679122377.9890d0642dfc.2360.17 +3 -0
- runs/Mar18_06-58-48_9890d0642dfc/1679122738.5127883/events.out.tfevents.1679122738.9890d0642dfc.10171.1 +3 -0
- runs/Mar18_06-58-48_9890d0642dfc/events.out.tfevents.1679122738.9890d0642dfc.10171.0 +3 -0
- runs/Mar18_07-00-18_9890d0642dfc/1679122840.795825/events.out.tfevents.1679122840.9890d0642dfc.10171.3 +3 -0
- runs/Mar18_07-00-18_9890d0642dfc/1679122956.9261463/events.out.tfevents.1679122956.9890d0642dfc.10171.4 +3 -0
- runs/Mar18_07-00-18_9890d0642dfc/events.out.tfevents.1679122840.9890d0642dfc.10171.2 +3 -0
- runs/Mar18_07-04-39_9890d0642dfc/1679123089.3368871/events.out.tfevents.1679123089.9890d0642dfc.12111.1 +3 -0
- runs/Mar18_07-04-39_9890d0642dfc/events.out.tfevents.1679123089.9890d0642dfc.12111.0 +3 -0
- runs/Mar18_07-16-55_9890d0642dfc/1679123826.059968/events.out.tfevents.1679123826.9890d0642dfc.14299.1 +3 -0
- runs/Mar18_07-16-55_9890d0642dfc/events.out.tfevents.1679123826.9890d0642dfc.14299.0 +3 -0
- runs/Mar18_07-18-53_9890d0642dfc/1679123943.4282925/events.out.tfevents.1679123943.9890d0642dfc.16157.1 +3 -0
- runs/Mar18_07-18-53_9890d0642dfc/events.out.tfevents.1679123943.9890d0642dfc.16157.0 +3 -0
- special_tokens_map.json +5 -0
- spiece.model +3 -0
- tokenizer.json +3 -0
- tokenizer_config.json +11 -0
- training_args.bin +3 -0
.gitattributes
CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
35 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "google/mt5-large",
|
3 |
+
"architectures": [
|
4 |
+
"MT5ForConditionalGeneration"
|
5 |
+
],
|
6 |
+
"d_ff": 2816,
|
7 |
+
"d_kv": 64,
|
8 |
+
"d_model": 1024,
|
9 |
+
"decoder_start_token_id": 0,
|
10 |
+
"dense_act_fn": "gelu_new",
|
11 |
+
"dropout_rate": 0.1,
|
12 |
+
"eos_token_id": 1,
|
13 |
+
"feed_forward_proj": "gated-gelu",
|
14 |
+
"initializer_factor": 1.0,
|
15 |
+
"is_encoder_decoder": true,
|
16 |
+
"is_gated_act": true,
|
17 |
+
"layer_norm_epsilon": 1e-06,
|
18 |
+
"model_type": "mt5",
|
19 |
+
"num_decoder_layers": 24,
|
20 |
+
"num_heads": 16,
|
21 |
+
"num_layers": 24,
|
22 |
+
"output_past": true,
|
23 |
+
"pad_token_id": 0,
|
24 |
+
"relative_attention_max_distance": 128,
|
25 |
+
"relative_attention_num_buckets": 32,
|
26 |
+
"tie_word_embeddings": false,
|
27 |
+
"tokenizer_class": "T5Tokenizer",
|
28 |
+
"torch_dtype": "float32",
|
29 |
+
"transformers_version": "4.27.1",
|
30 |
+
"use_cache": true,
|
31 |
+
"vocab_size": 250112
|
32 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"decoder_start_token_id": 0,
|
3 |
+
"eos_token_id": 1,
|
4 |
+
"pad_token_id": 0,
|
5 |
+
"transformers_version": "4.27.1"
|
6 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e43ae12e41c2e46005ac1ef073f133ee5370c6bd9577837b2e5da3730baf9120
|
3 |
+
size 4918519065
|
runs/Mar18_06-44-24_9890d0642dfc/1679121899.2792878/events.out.tfevents.1679121899.9890d0642dfc.2360.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:197e4d9b4d5de80afb83c0063fbb8aa3a8b67c988fae0008d86d5bf3499c850c
|
3 |
+
size 6034
|
runs/Mar18_06-44-24_9890d0642dfc/events.out.tfevents.1679121899.9890d0642dfc.2360.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bef6cfbbb218007da3271de4857346c133a81cd4adc634f546122b7564eb4f94
|
3 |
+
size 4204
|
runs/Mar18_06-46-54_9890d0642dfc/1679122034.1118152/events.out.tfevents.1679122034.9890d0642dfc.2360.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db1390efb74823179a1d8f417113e09506c71c178337a2c27e91674283676f73
|
3 |
+
size 6034
|
runs/Mar18_06-46-54_9890d0642dfc/1679122058.75141/events.out.tfevents.1679122058.9890d0642dfc.2360.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0394705083889190b8a93c39d9f7763cc42ad74db8bd5ebd4775d982ffdbf4d2
|
3 |
+
size 6034
|
runs/Mar18_06-46-54_9890d0642dfc/events.out.tfevents.1679122034.9890d0642dfc.2360.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dff162f19322590ba9da1aebb62a0adb9124c5f0ac373b07505757af5ec85259
|
3 |
+
size 8368
|
runs/Mar18_06-49-01_9890d0642dfc/1679122158.6341114/events.out.tfevents.1679122158.9890d0642dfc.2360.10
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ba0c7424c91a6b65dc163a95e9ad17f5ad55419a008dc5263dd3278e334b337
|
3 |
+
size 6034
|
runs/Mar18_06-49-01_9890d0642dfc/events.out.tfevents.1679122158.9890d0642dfc.2360.9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a11ddfddb19b0aa7a8a97568fa8d03fb03c5e4959ecb0283226dab47dc2aa001
|
3 |
+
size 4204
|
runs/Mar18_06-49-44_9890d0642dfc/1679122201.4648492/events.out.tfevents.1679122201.9890d0642dfc.2360.12
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be636af4b85996db1daea9684fd1463976870f038b63cb222cf11fcac1834bd5
|
3 |
+
size 6034
|
runs/Mar18_06-49-44_9890d0642dfc/1679122214.9618635/events.out.tfevents.1679122214.9890d0642dfc.2360.13
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9eb1763db38c86f3c8cbe2e9cc99058dd32f6707295d89aa25d171474c3c4309
|
3 |
+
size 6034
|
runs/Mar18_06-49-44_9890d0642dfc/events.out.tfevents.1679122201.9890d0642dfc.2360.11
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ba638a93bb1965d576d8218b970bba89ddc1e2b9e8a7fcb8b3d22065eb27769
|
3 |
+
size 8364
|
runs/Mar18_06-50-48_9890d0642dfc/1679122281.7235017/events.out.tfevents.1679122281.9890d0642dfc.2360.15
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2976f4da734859589f4e78b9354fe573c42330ba538edb31a379dfaae59adf21
|
3 |
+
size 6034
|
runs/Mar18_06-50-48_9890d0642dfc/1679122293.9574654/events.out.tfevents.1679122293.9890d0642dfc.2360.16
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be55e16ffb0fdb714d2917ed514694d092b91cdcc33860b6f2f5da1c2ffb123e
|
3 |
+
size 6034
|
runs/Mar18_06-50-48_9890d0642dfc/events.out.tfevents.1679122281.9890d0642dfc.2360.14
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9af289b1bb821060db422960b11fdf9f92fe7d01ff7ad642929ddd6545c8d07e
|
3 |
+
size 8366
|
runs/Mar18_06-52-23_9890d0642dfc/1679122377.6678984/events.out.tfevents.1679122377.9890d0642dfc.2360.18
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:497469f6e1e53b7e2a801f0ee4d1b95c711a5125d6b671e261c12ca4c0b7627f
|
3 |
+
size 6034
|
runs/Mar18_06-52-23_9890d0642dfc/1679122391.7081497/events.out.tfevents.1679122391.9890d0642dfc.2360.19
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55c8892a60467b4271b6822ad54811e632ab5d28e0ce611338691f28ac4aea50
|
3 |
+
size 6034
|
runs/Mar18_06-52-23_9890d0642dfc/1679122563.8788617/events.out.tfevents.1679122563.9890d0642dfc.2360.20
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:714d2d1562aa842b07f1c562cb69eebfe95b4399114d5c2da70c116171830973
|
3 |
+
size 6034
|
runs/Mar18_06-52-23_9890d0642dfc/events.out.tfevents.1679122377.9890d0642dfc.2360.17
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3c54042b52511173c2541218ed3ccdc2a5131216cf865ebb3cf60482db070c6
|
3 |
+
size 12460
|
runs/Mar18_06-58-48_9890d0642dfc/1679122738.5127883/events.out.tfevents.1679122738.9890d0642dfc.10171.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02223d5e1ccd2cda2086d98345161f319f26333a900f983b4a9d302431fd477e
|
3 |
+
size 6034
|
runs/Mar18_06-58-48_9890d0642dfc/events.out.tfevents.1679122738.9890d0642dfc.10171.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c3dbd94bdb73ea669b15a0df542f7a871898542768136cb45b9608e7f3c6667
|
3 |
+
size 4202
|
runs/Mar18_07-00-18_9890d0642dfc/1679122840.795825/events.out.tfevents.1679122840.9890d0642dfc.10171.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32c051393e7fd9e145c18a1167a88f3c5b6a0b544dedbdd030445fef99987e7b
|
3 |
+
size 6034
|
runs/Mar18_07-00-18_9890d0642dfc/1679122956.9261463/events.out.tfevents.1679122956.9890d0642dfc.10171.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e41189dea7a0725aaf812e2f2db40d7e278e05e84e1572e5fa0a30561f36073
|
3 |
+
size 6034
|
runs/Mar18_07-00-18_9890d0642dfc/events.out.tfevents.1679122840.9890d0642dfc.10171.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3540fef723bc17282476df0a0180fd69b93f016548cafd56a02ff7b5b20ef08c
|
3 |
+
size 8232
|
runs/Mar18_07-04-39_9890d0642dfc/1679123089.3368871/events.out.tfevents.1679123089.9890d0642dfc.12111.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ead5aa3b78441ffe865b7983739d6fd723f13ed3719477558292d002b42ecf2f
|
3 |
+
size 6034
|
runs/Mar18_07-04-39_9890d0642dfc/events.out.tfevents.1679123089.9890d0642dfc.12111.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:259d8f615f785ebc6aa5fcce0083dcf7a75d9153f36588cd185e9ef3b02b4864
|
3 |
+
size 4202
|
runs/Mar18_07-16-55_9890d0642dfc/1679123826.059968/events.out.tfevents.1679123826.9890d0642dfc.14299.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a15c73f1d95c7aa786617ec83aae9549e26fddc67391a20f62ba3f4cd70bec1f
|
3 |
+
size 6034
|
runs/Mar18_07-16-55_9890d0642dfc/events.out.tfevents.1679123826.9890d0642dfc.14299.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f90afeff2a58285c658c0e50079578473d6ef28e05fe975ce82586bbceb5517
|
3 |
+
size 4136
|
runs/Mar18_07-18-53_9890d0642dfc/1679123943.4282925/events.out.tfevents.1679123943.9890d0642dfc.16157.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9461b6a53862622e7bb68302870b64c3024616d833a38e5a53bfa508374f47e1
|
3 |
+
size 6034
|
runs/Mar18_07-18-53_9890d0642dfc/events.out.tfevents.1679123943.9890d0642dfc.16157.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82b88a662d61189bdfabd1fb9cbd20a9c90018e956378781ffe3263ee40dd61c
|
3 |
+
size 4359
|
special_tokens_map.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"eos_token": "</s>",
|
3 |
+
"pad_token": "<pad>",
|
4 |
+
"unk_token": "<unk>"
|
5 |
+
}
|
spiece.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
|
3 |
+
size 4309802
|
tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad87025a36c0e90fb1dab13f69c58d99a96404d789288636b02d5dc763dcf299
|
3 |
+
size 16330466
|
tokenizer_config.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"additional_special_tokens": null,
|
3 |
+
"eos_token": "</s>",
|
4 |
+
"extra_ids": 0,
|
5 |
+
"model_max_length": 1000000000000000019884624838656,
|
6 |
+
"pad_token": "<pad>",
|
7 |
+
"sp_model_kwargs": {},
|
8 |
+
"special_tokens_map_file": "/home/patrick/.cache/torch/transformers/685ac0ca8568ec593a48b61b0a3c272beee9bc194a3c7241d15dcadb5f875e53.f76030f3ec1b96a8199b2593390c610e76ca8028ef3d24680000619ffb646276",
|
9 |
+
"tokenizer_class": "T5Tokenizer",
|
10 |
+
"unk_token": "<unk>"
|
11 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c746a40e970b3a9a8b058f370b27c39c1c01656e8be9133bdd9d9a2033d40cd6
|
3 |
+
size 3707
|