e22vvb committed on
Commit
5e71958
1 Parent(s): aabe6e8

End of training

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - generated_from_trainer
4
+ model-index:
5
+ - name: ALL_mt5-base_15_spider_15_wikiSQL_new
6
+ results: []
7
+ ---
8
+
9
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
10
+ should probably proofread and complete it, then remove this comment. -->
11
+
12
+ # ALL_mt5-base_15_spider_15_wikiSQL_new
13
+
14
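+ The Trainer recorded no base model or dataset for this run, so this card was auto-generated as "trained from scratch on an unknown dataset". Judging by the model name and the tokenizer path (`EN_mt5-base_15_wikiSQL`), it was presumably fine-tuned from an mT5-base checkpoint on Spider and WikiSQL text-to-SQL data; confirm before relying on this.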
15
+ It achieves the following results on the evaluation set:
16
+ - Loss: 0.2909
17
+ - Rouge2 Precision: 0.6313
18
+ - Rouge2 Recall: 0.4304
19
+ - Rouge2 Fmeasure: 0.4825
20
+
21
+ ## Model description
22
+
23
+ More information needed
24
+
25
+ ## Intended uses & limitations
26
+
27
+ More information needed
28
+
29
+ ## Training and evaluation data
30
+
31
+ More information needed
32
+
33
+ ## Training procedure
34
+
35
+ ### Training hyperparameters
36
+
37
+ The following hyperparameters were used during training:
38
+ - learning_rate: 5e-05
39
+ - train_batch_size: 19
40
+ - eval_batch_size: 16
41
+ - seed: 42
42
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
+ - lr_scheduler_type: linear
44
+ - num_epochs: 15
45
+
46
+ ### Training results
47
+
48
+ | Training Loss | Epoch | Step | Validation Loss | Rouge2 Precision | Rouge2 Recall | Rouge2 Fmeasure |
49
+ |:-------------:|:-----:|:-----:|:---------------:|:----------------:|:-------------:|:---------------:|
50
+ | 0.2246 | 1.0 | 1021 | 0.2285 | 0.5427 | 0.3561 | 0.4023 |
51
+ | 0.1399 | 2.0 | 2042 | 0.2178 | 0.5685 | 0.3784 | 0.4254 |
52
+ | 0.1064 | 3.0 | 3063 | 0.2239 | 0.5832 | 0.3955 | 0.443 |
53
+ | 0.0849 | 4.0 | 4084 | 0.2297 | 0.6109 | 0.4157 | 0.466 |
54
+ | 0.0725 | 5.0 | 5105 | 0.2445 | 0.6023 | 0.4067 | 0.4567 |
55
+ | 0.0614 | 6.0 | 6126 | 0.2444 | 0.607 | 0.4123 | 0.4621 |
56
+ | 0.053 | 7.0 | 7147 | 0.2522 | 0.6158 | 0.419 | 0.4694 |
57
+ | 0.0479 | 8.0 | 8168 | 0.2612 | 0.6187 | 0.4194 | 0.4706 |
58
+ | 0.043 | 9.0 | 9189 | 0.2636 | 0.6249 | 0.4268 | 0.4782 |
59
+ | 0.0402 | 10.0 | 10210 | 0.2697 | 0.6304 | 0.4296 | 0.4818 |
60
+ | 0.0368 | 11.0 | 11231 | 0.2770 | 0.6299 | 0.43 | 0.482 |
61
+ | 0.0348 | 12.0 | 12252 | 0.2836 | 0.6284 | 0.4274 | 0.4795 |
62
+ | 0.0329 | 13.0 | 13273 | 0.2879 | 0.6233 | 0.4242 | 0.4758 |
63
+ | 0.0324 | 14.0 | 14294 | 0.2913 | 0.6303 | 0.4296 | 0.4818 |
64
+ | 0.0313 | 15.0 | 15315 | 0.2909 | 0.6313 | 0.4304 | 0.4825 |
65
+
66
+
67
+ ### Framework versions
68
+
69
+ - Transformers 4.26.1
70
+ PyTorch 2.0.1+cu117
71
+ - Datasets 2.14.7.dev0
72
+ - Tokenizers 0.13.3
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "decoder_start_token_id": 0,
4
+ "eos_token_id": 1,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.26.1"
7
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2415efdbd6cc2878302a00fe6a61e09f31c418929d91de477d5e9e10c91ed9ee
3
  size 2329702581
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b0be0ea01f13f2730d3f7c892dbeecd45ee3bbead48cb762514fefc4e2c8d1a
3
  size 2329702581
runs/Feb03_13-08-59_munich/events.out.tfevents.1706940546.munich.1021065.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d7ddff0a58ecfce3e2d8357470bc2fc2793cfb3700bea860633545ff74261de
3
- size 15751
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b59811b14aaf4a305d0868cc9b8a775a77986609ef67d3dedc6afd1a3f3f0d39
3
+ size 16105
special_tokens_map.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "eos_token": "</s>",
3
+ "pad_token": "<pad>",
4
+ "unk_token": "<unk>"
5
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
3
+ size 4309802
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:683ad341b77c862aa429e73bcbcefb2e36c4abc6ecb0ab788997b6f0566457a7
3
+ size 16315386
tokenizer_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "eos_token": "</s>",
4
+ "extra_ids": 0,
5
+ "model_max_length": 1000000000000000019884624838656,
6
+ "name_or_path": "/home/tong/text_to_sql/content/EN_mt5-base_15_wikiSQL",
7
+ "pad_token": "<pad>",
8
+ "sp_model_kwargs": {},
9
+ "special_tokens_map_file": "/home/patrick/.cache/torch/transformers/685ac0ca8568ec593a48b61b0a3c272beee9bc194a3c7241d15dcadb5f875e53.f76030f3ec1b96a8199b2593390c610e76ca8028ef3d24680000619ffb646276",
10
+ "tokenizer_class": "T5Tokenizer",
11
+ "unk_token": "<unk>"
12
+ }