jslai//content/sample_data/best_models//MBERT_uncased_CrossEntropyLoss_lora
Browse files
- README.md +9 -9
- adapter_config.json +11 -11
- adapter_model.safetensors +1 -1
README.md
CHANGED
@@ -21,12 +21,12 @@ should probably proofread and complete it, then remove this comment. -->
|
|
21 |
|
22 |
This model is a fine-tuned version of [google-bert/bert-base-multilingual-uncased](https://huggingface.co/google-bert/bert-base-multilingual-uncased) on the None dataset.
|
23 |
It achieves the following results on the evaluation set:
|
24 |
-
- Loss: 0.
|
25 |
-
- Accuracy: 0.
|
26 |
-
- F1: 0.
|
27 |
-
- Precision: 0.
|
28 |
-
- Recall: 0.
|
29 |
-
- Roc Auc: 0.
|
30 |
|
31 |
## Model description
|
32 |
|
@@ -61,9 +61,9 @@ The following hyperparameters were used during training:
|
|
61 |
|
62 |
| Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall | Roc Auc |
|
63 |
|:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|:-------:|
|
64 |
-
| No log | 0.992 | 31 | 0.
|
65 |
-
| No log | 1.984 | 62 | 0.
|
66 |
-
| No log | 2.976 | 93 | 0.
|
67 |
|
68 |
|
69 |
### Framework versions
|
|
|
21 |
|
22 |
This model is a fine-tuned version of [google-bert/bert-base-multilingual-uncased](https://huggingface.co/google-bert/bert-base-multilingual-uncased) on the None dataset.
|
23 |
It achieves the following results on the evaluation set:
|
24 |
+
- Loss: 0.6573
|
25 |
+
- Accuracy: 0.717
|
26 |
+
- F1: 0.8344
|
27 |
+
- Precision: 0.7239
|
28 |
+
- Recall: 0.9848
|
29 |
+
- Roc Auc: 0.4996
|
30 |
|
31 |
## Model description
|
32 |
|
|
|
61 |
|
62 |
| Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall | Roc Auc |
|
63 |
|:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|:-------:|
|
64 |
+
| No log | 0.992 | 31 | 0.6666 | 0.693 | 0.8174 | 0.7179 | 0.9489 | 0.4853 |
|
65 |
+
| No log | 1.984 | 62 | 0.6595 | 0.714 | 0.8324 | 0.7230 | 0.9807 | 0.4976 |
|
66 |
+
| No log | 2.976 | 93 | 0.6573 | 0.717 | 0.8344 | 0.7239 | 0.9848 | 0.4996 |
|
67 |
|
68 |
|
69 |
### Framework versions
|
adapter_config.json
CHANGED
@@ -26,22 +26,22 @@
|
|
26 |
"rank_pattern": {},
|
27 |
"revision": null,
|
28 |
"target_modules": [
|
29 |
-
"
|
|
|
|
|
30 |
"10.output.dense",
|
31 |
"7.output.dense",
|
32 |
-
"
|
33 |
-
"11.output.dense",
|
34 |
-
"6.output.dense",
|
35 |
"query",
|
36 |
-
"
|
37 |
"1.output.dense",
|
38 |
-
"3.output.dense",
|
39 |
-
"8.output.dense",
|
40 |
-
"key",
|
41 |
"4.output.dense",
|
42 |
-
"
|
43 |
-
"
|
44 |
-
"
|
|
|
|
|
|
|
45 |
],
|
46 |
"task_type": "SEQ_CLS",
|
47 |
"use_dora": false,
|
|
|
26 |
"rank_pattern": {},
|
27 |
"revision": null,
|
28 |
"target_modules": [
|
29 |
+
"9.output.dense",
|
30 |
+
"3.output.dense",
|
31 |
+
"8.output.dense",
|
32 |
"10.output.dense",
|
33 |
"7.output.dense",
|
34 |
+
"2.output.dense",
|
|
|
|
|
35 |
"query",
|
36 |
+
"value",
|
37 |
"1.output.dense",
|
|
|
|
|
|
|
38 |
"4.output.dense",
|
39 |
+
"intermediate.dense",
|
40 |
+
"5.output.dense",
|
41 |
+
"6.output.dense",
|
42 |
+
"key",
|
43 |
+
"0.output.dense",
|
44 |
+
"11.output.dense"
|
45 |
],
|
46 |
"task_type": "SEQ_CLS",
|
47 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 9460216
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d34f1e1d19d119762cc1845a872ee9a1287b06575fd7f7320b3c35639db33ad3
|
3 |
size 9460216
|