End of training
Browse files
- README.md +22 -35
- config.json +1 -1
- pytorch_model.bin +2 -2
README.md
CHANGED
@@ -6,14 +6,14 @@ tags:
|
|
6 |
metrics:
|
7 |
- accuracy
|
8 |
model-index:
|
9 |
-
- name: xtremedistil-l6-h384-uncased-
|
10 |
results: []
|
11 |
---
|
12 |
|
13 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
14 |
should probably proofread and complete it, then remove this comment. -->
|
15 |
|
16 |
-
# xtremedistil-l6-h384-uncased-
|
17 |
|
18 |
This model is a fine-tuned version of [microsoft/xtremedistil-l6-h384-uncased](https://huggingface.co/microsoft/xtremedistil-l6-h384-uncased) on an unspecified dataset (the training run did not record a dataset name).
|
19 |
It achieves the following results on the evaluation set:
|
@@ -57,39 +57,26 @@ The following hyperparameters were used during training:
|
|
57 |
|
58 |
### Training results
|
59 |
|
60 |
-
|
|
61 |
-
|
62 |
-
|
|
63 |
-
|
|
64 |
-
|
|
65 |
-
|
|
66 |
-
|
|
67 |
-
|
|
68 |
-
|
|
69 |
-
|
|
70 |
-
|
|
71 |
-
|
|
72 |
-
|
|
73 |
-
|
|
74 |
-
|
|
75 |
-
|
76 |
-
|
77 |
-
|
|
78 |
-
|
|
79 |
-
|
80 |
-
|eval_f1_macro|0.717|0.488|0.684|0.7|
|
81 |
-
|eval_f1_micro|0.718|0.506|0.684|0.7|
|
82 |
-
|eval_accuracy_balanced|0.719|0.501|0.687|0.702|
|
83 |
-
|eval_accuracy|0.718|0.506|0.684|0.7|
|
84 |
-
|eval_precision_macro|0.718|0.501|0.686|0.701|
|
85 |
-
|eval_recall_macro|0.719|0.501|0.687|0.702|
|
86 |
-
|eval_precision_micro|0.718|0.506|0.684|0.7|
|
87 |
-
|eval_recall_micro|0.718|0.506|0.684|0.7|
|
88 |
-
|eval_runtime|8.405|0.176|1.864|7.407|
|
89 |
-
|eval_samples_per_second|1011.367|5358.555|1013.595|1020.275|
|
90 |
-
|eval_steps_per_second|7.972|45.315|8.049|8.101|
|
91 |
-
|epoch|3.0|3.0|3.0|3.0|
|
92 |
-
|Size of dataset|8500|946|1889|7557|
|
93 |
|
94 |
### Framework versions
|
95 |
|
|
|
6 |
metrics:
|
7 |
- accuracy
|
8 |
model-index:
|
9 |
+
- name: xtremedistil-l6-h384-uncased-v2.0
|
10 |
results: []
|
11 |
---
|
12 |
|
13 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
14 |
should probably proofread and complete it, then remove this comment. -->
|
15 |
|
16 |
+
# xtremedistil-l6-h384-uncased-v2.0
|
17 |
|
18 |
This model is a fine-tuned version of [microsoft/xtremedistil-l6-h384-uncased](https://huggingface.co/microsoft/xtremedistil-l6-h384-uncased) on an unspecified dataset (the training run did not record a dataset name).
|
19 |
It achieves the following results on the evaluation set:
|
|
|
57 |
|
58 |
### Training results
|
59 |
|
60 |
+
| Training Loss | Epoch | Step | Validation Loss | F1 Macro | F1 Micro | Accuracy Balanced | Accuracy | Precision Macro | Recall Macro | Precision Micro | Recall Micro |
|
61 |
+
|:-------------:|:-----:|:----:|:---------------:|:--------:|:--------:|:-----------------:|:--------:|:---------------:|:------------:|:---------------:|:------------:|
|
62 |
+
| 0.6275 | 0.17 | 200 | 0.6177 | 0.3647 | 0.5463 | 0.5039 | 0.5463 | 0.6163 | 0.5039 | 0.5463 | 0.5463 |
|
63 |
+
| 0.5811 | 0.34 | 400 | 0.5808 | 0.5807 | 0.6194 | 0.5976 | 0.6194 | 0.6331 | 0.5976 | 0.6194 | 0.6194 |
|
64 |
+
| 0.5769 | 0.51 | 600 | 0.5680 | 0.6564 | 0.6585 | 0.6703 | 0.6585 | 0.6796 | 0.6703 | 0.6585 | 0.6585 |
|
65 |
+
| 0.5647 | 0.68 | 800 | 0.5634 | 0.6703 | 0.6728 | 0.6855 | 0.6728 | 0.6976 | 0.6855 | 0.6728 | 0.6728 |
|
66 |
+
| 0.5607 | 0.85 | 1000 | 0.5720 | 0.6176 | 0.6448 | 0.6264 | 0.6448 | 0.6569 | 0.6264 | 0.6448 | 0.6448 |
|
67 |
+
| 0.5645 | 1.02 | 1200 | 0.5617 | 0.6523 | 0.6601 | 0.6521 | 0.6601 | 0.6581 | 0.6521 | 0.6601 | 0.6601 |
|
68 |
+
| 0.5665 | 1.19 | 1400 | 0.5479 | 0.6802 | 0.6840 | 0.6986 | 0.6840 | 0.7172 | 0.6986 | 0.6840 | 0.6840 |
|
69 |
+
| 0.5432 | 1.35 | 1600 | 0.5540 | 0.6642 | 0.6665 | 0.6644 | 0.6665 | 0.6641 | 0.6644 | 0.6665 | 0.6665 |
|
70 |
+
| 0.5427 | 1.52 | 1800 | 0.5520 | 0.6533 | 0.6617 | 0.6532 | 0.6617 | 0.6601 | 0.6532 | 0.6617 | 0.6617 |
|
71 |
+
| 0.5453 | 1.69 | 2000 | 0.5487 | 0.6756 | 0.6781 | 0.6755 | 0.6781 | 0.6757 | 0.6755 | 0.6781 | 0.6781 |
|
72 |
+
| 0.5528 | 1.86 | 2200 | 0.5492 | 0.6720 | 0.6771 | 0.6713 | 0.6771 | 0.6747 | 0.6713 | 0.6771 | 0.6771 |
|
73 |
+
| 0.531 | 2.03 | 2400 | 0.5476 | 0.6799 | 0.6803 | 0.6882 | 0.6803 | 0.6911 | 0.6882 | 0.6803 | 0.6803 |
|
74 |
+
| 0.5199 | 2.2 | 2600 | 0.5454 | 0.6823 | 0.6824 | 0.6863 | 0.6824 | 0.6856 | 0.6863 | 0.6824 | 0.6824 |
|
75 |
+
| 0.535 | 2.37 | 2800 | 0.5441 | 0.6797 | 0.6803 | 0.6817 | 0.6803 | 0.6804 | 0.6817 | 0.6803 | 0.6803 |
|
76 |
+
| 0.5246 | 2.54 | 3000 | 0.5453 | 0.6746 | 0.6750 | 0.6771 | 0.6750 | 0.6759 | 0.6771 | 0.6750 | 0.6750 |
|
77 |
+
| 0.5405 | 2.71 | 3200 | 0.5408 | 0.6824 | 0.6861 | 0.6819 | 0.6861 | 0.6836 | 0.6819 | 0.6861 | 0.6861 |
|
78 |
+
| 0.5414 | 2.88 | 3400 | 0.5404 | 0.6826 | 0.6834 | 0.6841 | 0.6834 | 0.6828 | 0.6841 | 0.6834 | 0.6834 |
|
79 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
80 |
|
81 |
### Framework versions
|
82 |
|
config.json
CHANGED
@@ -27,7 +27,7 @@
|
|
27 |
"pad_token_id": 0,
|
28 |
"position_embedding_type": "absolute",
|
29 |
"problem_type": "single_label_classification",
|
30 |
-
"torch_dtype": "
|
31 |
"transformers_version": "4.33.3",
|
32 |
"type_vocab_size": 2,
|
33 |
"use_cache": true,
|
|
|
27 |
"pad_token_id": 0,
|
28 |
"position_embedding_type": "absolute",
|
29 |
"problem_type": "single_label_classification",
|
30 |
+
"torch_dtype": "float16",
|
31 |
"transformers_version": "4.33.3",
|
32 |
"type_vocab_size": 2,
|
33 |
"use_cache": true,
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc9784ccb8ade0cd06803fc824d515cc4d2dd31b1976be8e15a4e134ba7d61f1
|
3 |
+
size 45463854
|