jsl5710 committed on
Commit
e338ddd
1 Parent(s): bab5ad9

jslai//content/sample_data/best_models//MBERT_uncased_CrossEntropyLoss_lora

Browse files
Files changed (3) hide show
  1. README.md +9 -9
  2. adapter_config.json +11 -11
  3. adapter_model.safetensors +1 -1
README.md CHANGED
@@ -21,12 +21,12 @@ should probably proofread and complete it, then remove this comment. -->
21
 
22
  This model is a fine-tuned version of [google-bert/bert-base-multilingual-uncased](https://huggingface.co/google-bert/bert-base-multilingual-uncased) on an unspecified dataset.
23
  It achieves the following results on the evaluation set:
24
- - Loss: 0.6924
25
- - Accuracy: 0.518
26
- - F1: 0.6730
27
- - Precision: 0.6613
28
- - Recall: 0.6851
29
- - Roc Auc: 0.3824
30
 
31
  ## Model description
32
 
@@ -61,9 +61,9 @@ The following hyperparameters were used during training:
61
 
62
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall | Roc Auc |
63
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|:-------:|
64
- | No log | 0.992 | 31 | 0.7081 | 0.347 | 0.4287 | 0.5847 | 0.3384 | 0.3540 |
65
- | No log | 1.984 | 62 | 0.6961 | 0.479 | 0.6354 | 0.6440 | 0.6271 | 0.3588 |
66
- | No log | 2.976 | 93 | 0.6924 | 0.518 | 0.6730 | 0.6613 | 0.6851 | 0.3824 |
67
 
68
 
69
  ### Framework versions
 
21
 
22
  This model is a fine-tuned version of [google-bert/bert-base-multilingual-uncased](https://huggingface.co/google-bert/bert-base-multilingual-uncased) on an unspecified dataset.
23
  It achieves the following results on the evaluation set:
24
+ - Loss: 0.6573
25
+ - Accuracy: 0.717
26
+ - F1: 0.8344
27
+ - Precision: 0.7239
28
+ - Recall: 0.9848
29
+ - Roc Auc: 0.4996
30
 
31
  ## Model description
32
 
 
61
 
62
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall | Roc Auc |
63
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|:-------:|
64
+ | No log | 0.992 | 31 | 0.6666 | 0.693 | 0.8174 | 0.7179 | 0.9489 | 0.4853 |
65
+ | No log | 1.984 | 62 | 0.6595 | 0.714 | 0.8324 | 0.7230 | 0.9807 | 0.4976 |
66
+ | No log | 2.976 | 93 | 0.6573 | 0.717 | 0.8344 | 0.7239 | 0.9848 | 0.4996 |
67
 
68
 
69
  ### Framework versions
adapter_config.json CHANGED
@@ -26,22 +26,22 @@
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
29
- "2.output.dense",
 
 
30
  "10.output.dense",
31
  "7.output.dense",
32
- "0.output.dense",
33
- "11.output.dense",
34
- "6.output.dense",
35
  "query",
36
- "intermediate.dense",
37
  "1.output.dense",
38
- "3.output.dense",
39
- "8.output.dense",
40
- "key",
41
  "4.output.dense",
42
- "value",
43
- "9.output.dense",
44
- "5.output.dense"
 
 
 
45
  ],
46
  "task_type": "SEQ_CLS",
47
  "use_dora": false,
 
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
29
+ "9.output.dense",
30
+ "3.output.dense",
31
+ "8.output.dense",
32
  "10.output.dense",
33
  "7.output.dense",
34
+ "2.output.dense",
 
 
35
  "query",
36
+ "value",
37
  "1.output.dense",
 
 
 
38
  "4.output.dense",
39
+ "intermediate.dense",
40
+ "5.output.dense",
41
+ "6.output.dense",
42
+ "key",
43
+ "0.output.dense",
44
+ "11.output.dense"
45
  ],
46
  "task_type": "SEQ_CLS",
47
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbf2f8bd5fd0b9ee7d80ff96a52e17294e9a5993f0c4ff96bc133dee7c672233
3
  size 9460216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d34f1e1d19d119762cc1845a872ee9a1287b06575fd7f7320b3c35639db33ad3
3
  size 9460216