Training in progress, epoch 1
Browse files- .gitattributes +1 -0
- config.json +32 -0
- model.safetensors +3 -0
- runs/Jun19_06-47-08_eae9afaf4557/events.out.tfevents.1718779801.eae9afaf4557.1697.0 +3 -0
- runs/Jun19_07-35-26_eae9afaf4557/events.out.tfevents.1718782635.eae9afaf4557.14766.0 +3 -0
- runs/Jun19_07-35-26_eae9afaf4557/events.out.tfevents.1718782794.eae9afaf4557.14766.1 +3 -0
- runs/Jun19_08-06-59_eae9afaf4557/events.out.tfevents.1718784938.eae9afaf4557.14766.2 +3 -0
- runs/Jun19_08-06-59_eae9afaf4557/events.out.tfevents.1718785200.eae9afaf4557.14766.3 +3 -0
- runs/Jun19_08-06-59_eae9afaf4557/events.out.tfevents.1718786188.eae9afaf4557.14766.4 +3 -0
- runs/Jun19_08-37-50_eae9afaf4557/events.out.tfevents.1718786397.eae9afaf4557.14766.5 +3 -0
- runs/Jun19_08-37-50_eae9afaf4557/events.out.tfevents.1718786598.eae9afaf4557.14766.6 +3 -0
- runs/Jun19_08-37-50_eae9afaf4557/events.out.tfevents.1718786965.eae9afaf4557.14766.7 +3 -0
- runs/Jun19_09-51-01_eae9afaf4557/events.out.tfevents.1718790707.eae9afaf4557.34244.0 +3 -0
- runs/Jun19_09-52-29_eae9afaf4557/events.out.tfevents.1718790775.eae9afaf4557.34244.1 +3 -0
- special_tokens_map.json +23 -0
- spiece.model +3 -0
- tokenizer.json +3 -0
- tokenizer_config.json +39 -0
- training_args.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "google/mt5-small",
|
3 |
+
"architectures": [
|
4 |
+
"MT5ForConditionalGeneration"
|
5 |
+
],
|
6 |
+
"classifier_dropout": 0.0,
|
7 |
+
"d_ff": 1024,
|
8 |
+
"d_kv": 64,
|
9 |
+
"d_model": 512,
|
10 |
+
"decoder_start_token_id": 0,
|
11 |
+
"dense_act_fn": "gelu_new",
|
12 |
+
"dropout_rate": 0.1,
|
13 |
+
"eos_token_id": 1,
|
14 |
+
"feed_forward_proj": "gated-gelu",
|
15 |
+
"initializer_factor": 1.0,
|
16 |
+
"is_encoder_decoder": true,
|
17 |
+
"is_gated_act": true,
|
18 |
+
"layer_norm_epsilon": 1e-06,
|
19 |
+
"model_type": "mt5",
|
20 |
+
"num_decoder_layers": 8,
|
21 |
+
"num_heads": 6,
|
22 |
+
"num_layers": 8,
|
23 |
+
"pad_token_id": 0,
|
24 |
+
"relative_attention_max_distance": 128,
|
25 |
+
"relative_attention_num_buckets": 32,
|
26 |
+
"tie_word_embeddings": false,
|
27 |
+
"tokenizer_class": "T5Tokenizer",
|
28 |
+
"torch_dtype": "float32",
|
29 |
+
"transformers_version": "4.41.2",
|
30 |
+
"use_cache": true,
|
31 |
+
"vocab_size": 250112
|
32 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6cee875cd7f2ed365f854e3b212b48a77806a2d9ba7324853f4a8d4425f1693
|
3 |
+
size 1200729512
|
runs/Jun19_06-47-08_eae9afaf4557/events.out.tfevents.1718779801.eae9afaf4557.1697.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49fa12b3b1c8e57df953cb772a14e0c438e2627abff110807a2d46cd205d1d27
|
3 |
+
size 4438
|
runs/Jun19_07-35-26_eae9afaf4557/events.out.tfevents.1718782635.eae9afaf4557.14766.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07ccf2769599bf2e27d00a9c849296490be0e852596fea8ccddabcd9f818134c
|
3 |
+
size 342
|
runs/Jun19_07-35-26_eae9afaf4557/events.out.tfevents.1718782794.eae9afaf4557.14766.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ea7fc46c5686a0337d720b51636ede0542475d7597f9e8777dd0e429267f5e5
|
3 |
+
size 596
|
runs/Jun19_08-06-59_eae9afaf4557/events.out.tfevents.1718784938.eae9afaf4557.14766.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62fe0a4aa2b3d60151a97f09114746729f24af81ff11f5010d564a838c16b902
|
3 |
+
size 297
|
runs/Jun19_08-06-59_eae9afaf4557/events.out.tfevents.1718785200.eae9afaf4557.14766.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:820bf416092c68729f98f84b49d80fb0e1307806880c0abbbc8c7608ac33df20
|
3 |
+
size 297
|
runs/Jun19_08-06-59_eae9afaf4557/events.out.tfevents.1718786188.eae9afaf4557.14766.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccf687feb02bb9efee254a4ce09de3ccb14888eb9261fb26267855b7ea708ad9
|
3 |
+
size 342
|
runs/Jun19_08-37-50_eae9afaf4557/events.out.tfevents.1718786397.eae9afaf4557.14766.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9664497780bb1de17afa5be123fc98d088e0e831d6c0a5c7cf3cdbc4f47b9ae
|
3 |
+
size 342
|
runs/Jun19_08-37-50_eae9afaf4557/events.out.tfevents.1718786598.eae9afaf4557.14766.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f20b7de4c75e1dded1a800652b881912c7f02240c2caca37e72c16114feff2f1
|
3 |
+
size 342
|
runs/Jun19_08-37-50_eae9afaf4557/events.out.tfevents.1718786965.eae9afaf4557.14766.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:647e0ee078adfeafc9eaea6d31ee3be7980b7d843571a3b30c6e15d91b9f2578
|
3 |
+
size 4438
|
runs/Jun19_09-51-01_eae9afaf4557/events.out.tfevents.1718790707.eae9afaf4557.34244.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db68d1f059e64d5ccb11e4a8151121cd93d2af83aad9407ddd10040a5473b24d
|
3 |
+
size 342
|
runs/Jun19_09-52-29_eae9afaf4557/events.out.tfevents.1718790775.eae9afaf4557.34244.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bacbffa0336766ca486eecdf7a7238d1b32d6c1ab983b3e155b3f3838a36d5f
|
3 |
+
size 5316
|
special_tokens_map.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"eos_token": {
|
3 |
+
"content": "</s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"pad_token": {
|
10 |
+
"content": "<pad>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"unk_token": {
|
17 |
+
"content": "<unk>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
}
|
23 |
+
}
|
spiece.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
|
3 |
+
size 4309802
|
tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddb1b00035edffde435e24e69011b7f552691405237455cb7c3a59c890682807
|
3 |
+
size 16330540
|
tokenizer_config.json
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": true,
|
3 |
+
"added_tokens_decoder": {
|
4 |
+
"0": {
|
5 |
+
"content": "<pad>",
|
6 |
+
"lstrip": false,
|
7 |
+
"normalized": false,
|
8 |
+
"rstrip": false,
|
9 |
+
"single_word": false,
|
10 |
+
"special": true
|
11 |
+
},
|
12 |
+
"1": {
|
13 |
+
"content": "</s>",
|
14 |
+
"lstrip": false,
|
15 |
+
"normalized": false,
|
16 |
+
"rstrip": false,
|
17 |
+
"single_word": false,
|
18 |
+
"special": true
|
19 |
+
},
|
20 |
+
"2": {
|
21 |
+
"content": "<unk>",
|
22 |
+
"lstrip": false,
|
23 |
+
"normalized": false,
|
24 |
+
"rstrip": false,
|
25 |
+
"single_word": false,
|
26 |
+
"special": true
|
27 |
+
}
|
28 |
+
},
|
29 |
+
"additional_special_tokens": [],
|
30 |
+
"clean_up_tokenization_spaces": true,
|
31 |
+
"eos_token": "</s>",
|
32 |
+
"extra_ids": 0,
|
33 |
+
"legacy": true,
|
34 |
+
"model_max_length": 1000000000000000019884624838656,
|
35 |
+
"pad_token": "<pad>",
|
36 |
+
"sp_model_kwargs": {},
|
37 |
+
"tokenizer_class": "T5Tokenizer",
|
38 |
+
"unk_token": "<unk>"
|
39 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5979652aba4c909814d169ad54e13370c00eb1a3584aa789fa94198b63b044ac
|
3 |
+
size 5240
|