NatthawatTung committed on
Commit
655af29
1 Parent(s): 674f250

End of training

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - generated_from_trainer
5
+ model-index:
6
+ - name: ALL_mt5-base_10_wikiSQL_sch
7
+ results: []
8
+ ---
9
+
10
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
11
+ should probably proofread and complete it, then remove this comment. -->
12
+
13
+ # ALL_mt5-base_10_wikiSQL_sch
14
+
15
+ This model is a fine-tuned version of [google/mt5-base](https://huggingface.co/google/mt5-base) on an unknown dataset.
16
+ It achieves the following results on the evaluation set:
17
+ - Loss: 0.0566
18
+ - Rouge2 Precision: 0.8825
19
+ - Rouge2 Recall: 0.802
20
+ - Rouge2 Fmeasure: 0.8343
21
+
22
+ ## Model description
23
+
24
+ More information needed
25
+
26
+ ## Intended uses & limitations
27
+
28
+ More information needed
29
+
30
+ ## Training and evaluation data
31
+
32
+ More information needed
33
+
34
+ ## Training procedure
35
+
36
+ ### Training hyperparameters
37
+
38
+ The following hyperparameters were used during training:
39
+ - learning_rate: 5e-05
40
+ - train_batch_size: 15
41
+ - eval_batch_size: 16
42
+ - seed: 42
43
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
+ - lr_scheduler_type: linear
45
+ - num_epochs: 10
46
+
47
+ ### Training results
48
+
49
+ | Training Loss | Epoch | Step | Validation Loss | Rouge2 Precision | Rouge2 Recall | Rouge2 Fmeasure |
50
+ |:-------------:|:-----:|:-----:|:---------------:|:----------------:|:-------------:|:---------------:|
51
+ | 0.0789 | 1.0 | 8637 | 0.0678 | 0.859 | 0.7788 | 0.8103 |
52
+ | 0.0683 | 2.0 | 17274 | 0.0613 | 0.8688 | 0.7867 | 0.8196 |
53
+ | 0.0587 | 3.0 | 25911 | 0.0595 | 0.8726 | 0.7917 | 0.8241 |
54
+ | 0.0546 | 4.0 | 34548 | 0.0578 | 0.8771 | 0.7957 | 0.8284 |
55
+ | 0.0499 | 5.0 | 43185 | 0.0572 | 0.8793 | 0.7981 | 0.8308 |
56
+ | 0.0484 | 6.0 | 51822 | 0.0568 | 0.8797 | 0.7992 | 0.8315 |
57
+ | 0.0447 | 7.0 | 60459 | 0.0565 | 0.8809 | 0.8003 | 0.8326 |
58
+ | 0.0415 | 8.0 | 69096 | 0.0565 | 0.882 | 0.8013 | 0.8337 |
59
+ | 0.042 | 9.0 | 77733 | 0.0564 | 0.8822 | 0.8019 | 0.8341 |
60
+ | 0.0407 | 10.0 | 86370 | 0.0566 | 0.8825 | 0.802 | 0.8343 |
61
+
62
+
63
+ ### Framework versions
64
+
65
+ - Transformers 4.26.1
66
+ - Pytorch 2.1.2
67
+ - Datasets 2.16.1
68
+ - Tokenizers 0.13.3
special_tokens_map.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "eos_token": "</s>",
3
+ "pad_token": "<pad>",
4
+ "unk_token": "<unk>"
5
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
3
+ size 4309802
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b49fe5973ba16763424a9230fea46fd3bebedc6e497d7d230fb00ce9f5a2fb1
3
+ size 16330634
tokenizer_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "eos_token": "</s>",
4
+ "extra_ids": 0,
5
+ "model_max_length": 1000000000000000019884624838656,
6
+ "name_or_path": "google/mt5-base",
7
+ "pad_token": "<pad>",
8
+ "sp_model_kwargs": {},
9
+ "special_tokens_map_file": "/home/patrick/.cache/torch/transformers/685ac0ca8568ec593a48b61b0a3c272beee9bc194a3c7241d15dcadb5f875e53.f76030f3ec1b96a8199b2593390c610e76ca8028ef3d24680000619ffb646276",
10
+ "tokenizer_class": "T5Tokenizer",
11
+ "unk_token": "<unk>"
12
+ }