Commit
•
2baaa44
1
Parent(s):
4dae360
End of training
Browse files- ABSA_Sentiment_classification_Semeval_houlsby_Stack/adapter_config.json +41 -0
- ABSA_Sentiment_classification_Semeval_houlsby_Stack/head_config.json +21 -0
- ABSA_Sentiment_classification_Semeval_houlsby_Stack/pytorch_adapter.bin +3 -0
- ABSA_Sentiment_classification_Semeval_houlsby_Stack/pytorch_model_head.bin +3 -0
- all_results.json +24 -0
- eval_results.json +11 -0
- mlm/adapter_config.json +41 -0
- mlm/head_config.json +19 -0
- mlm/pytorch_adapter.bin +3 -0
- mlm/pytorch_model_head.bin +3 -0
- runs/Aug04_16-39-09_e296e91d98be/events.out.tfevents.1691167167.e296e91d98be.457.0 +2 -2
- runs/Aug04_16-39-09_e296e91d98be/events.out.tfevents.1691169630.e296e91d98be.457.2 +3 -0
- test_results.json +10 -0
- train_results.json +8 -0
ABSA_Sentiment_classification_Semeval_houlsby_Stack/adapter_config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"config": {
|
3 |
+
"adapter_residual_before_ln": false,
|
4 |
+
"cross_adapter": false,
|
5 |
+
"factorized_phm_W": true,
|
6 |
+
"factorized_phm_rule": false,
|
7 |
+
"hypercomplex_nonlinearity": "glorot-uniform",
|
8 |
+
"init_weights": "bert",
|
9 |
+
"inv_adapter": null,
|
10 |
+
"inv_adapter_reduction_factor": null,
|
11 |
+
"is_parallel": false,
|
12 |
+
"learn_phm": true,
|
13 |
+
"leave_out": [],
|
14 |
+
"ln_after": false,
|
15 |
+
"ln_before": false,
|
16 |
+
"mh_adapter": true,
|
17 |
+
"non_linearity": "swish",
|
18 |
+
"original_ln_after": true,
|
19 |
+
"original_ln_before": false,
|
20 |
+
"output_adapter": true,
|
21 |
+
"phm_bias": true,
|
22 |
+
"phm_c_init": "normal",
|
23 |
+
"phm_dim": 4,
|
24 |
+
"phm_init_range": 0.0001,
|
25 |
+
"phm_layer": false,
|
26 |
+
"phm_rank": 1,
|
27 |
+
"reduction_factor": 16,
|
28 |
+
"residual_before_ln": true,
|
29 |
+
"scaling": 1.0,
|
30 |
+
"shared_W_phm": false,
|
31 |
+
"shared_phm_rule": true,
|
32 |
+
"use_gating": false
|
33 |
+
},
|
34 |
+
"config_id": "b1017368d7a97b11",
|
35 |
+
"hidden_size": 768,
|
36 |
+
"model_class": "BertModelWithHeads",
|
37 |
+
"model_name": "CAMeL-Lab/bert-base-arabic-camelbert-msa",
|
38 |
+
"model_type": "bert",
|
39 |
+
"name": "ABSA_Sentiment_classification_Semeval_houlsby_Stack",
|
40 |
+
"version": "3.2.1"
|
41 |
+
}
|
ABSA_Sentiment_classification_Semeval_houlsby_Stack/head_config.json
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"config": {
|
3 |
+
"activation_function": "tanh",
|
4 |
+
"bias": true,
|
5 |
+
"head_type": "classification",
|
6 |
+
"label2id": {
|
7 |
+
"negative": 0,
|
8 |
+
"neutral": 2,
|
9 |
+
"positive": 1
|
10 |
+
},
|
11 |
+
"layers": 2,
|
12 |
+
"num_labels": 3,
|
13 |
+
"use_pooler": false
|
14 |
+
},
|
15 |
+
"hidden_size": 768,
|
16 |
+
"model_class": "BertModelWithHeads",
|
17 |
+
"model_name": "CAMeL-Lab/bert-base-arabic-camelbert-msa",
|
18 |
+
"model_type": "bert",
|
19 |
+
"name": "ABSA_Sentiment_classification_Semeval_houlsby_Stack",
|
20 |
+
"version": "3.2.1"
|
21 |
+
}
|
ABSA_Sentiment_classification_Semeval_houlsby_Stack/pytorch_adapter.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f79377baabfcd1d415e6f609b64788c3f198e02f6b0f3dc0bbd39b783358bba7
|
3 |
+
size 7195157
|
ABSA_Sentiment_classification_Semeval_houlsby_Stack/pytorch_model_head.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5555442a44cf2f5e663f830f9f90334ea2c5f961e6317a3888b05a5bf6180ad
|
3 |
+
size 2373473
|
all_results.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 20.0,
|
3 |
+
"eval_accuracy": 0.8752362948960303,
|
4 |
+
"eval_f1": 0.8752362948960303,
|
5 |
+
"eval_loss": 0.32043901085853577,
|
6 |
+
"eval_precision": 0.8752362948960303,
|
7 |
+
"eval_recall": 0.8752362948960303,
|
8 |
+
"eval_runtime": 17.8506,
|
9 |
+
"eval_samples_per_second": 118.539,
|
10 |
+
"eval_steps_per_second": 3.753,
|
11 |
+
"test_accuracy": 0.8740399385560675,
|
12 |
+
"test_f1": 0.8740399385560675,
|
13 |
+
"test_loss": 0.3366047143936157,
|
14 |
+
"test_precision": 0.8740399385560675,
|
15 |
+
"test_recall": 0.8740399385560675,
|
16 |
+
"test_runtime": 18.1593,
|
17 |
+
"test_samples_per_second": 143.397,
|
18 |
+
"test_steps_per_second": 4.516,
|
19 |
+
"total_flos": 8766240604668522.0,
|
20 |
+
"train_loss": 0.276022268061368,
|
21 |
+
"train_runtime": 2445.9034,
|
22 |
+
"train_samples_per_second": 69.185,
|
23 |
+
"train_steps_per_second": 2.167
|
24 |
+
}
|
eval_results.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 20.0,
|
3 |
+
"eval_accuracy": 0.8752362948960303,
|
4 |
+
"eval_f1": 0.8752362948960303,
|
5 |
+
"eval_loss": 0.32043901085853577,
|
6 |
+
"eval_precision": 0.8752362948960303,
|
7 |
+
"eval_recall": 0.8752362948960303,
|
8 |
+
"eval_runtime": 17.8506,
|
9 |
+
"eval_samples_per_second": 118.539,
|
10 |
+
"eval_steps_per_second": 3.753
|
11 |
+
}
|
mlm/adapter_config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"config": {
|
3 |
+
"adapter_residual_before_ln": false,
|
4 |
+
"cross_adapter": false,
|
5 |
+
"factorized_phm_W": true,
|
6 |
+
"factorized_phm_rule": false,
|
7 |
+
"hypercomplex_nonlinearity": "glorot-uniform",
|
8 |
+
"init_weights": "bert",
|
9 |
+
"inv_adapter": "nice",
|
10 |
+
"inv_adapter_reduction_factor": 2,
|
11 |
+
"is_parallel": false,
|
12 |
+
"learn_phm": true,
|
13 |
+
"leave_out": [],
|
14 |
+
"ln_after": false,
|
15 |
+
"ln_before": false,
|
16 |
+
"mh_adapter": false,
|
17 |
+
"non_linearity": "relu",
|
18 |
+
"original_ln_after": true,
|
19 |
+
"original_ln_before": true,
|
20 |
+
"output_adapter": true,
|
21 |
+
"phm_bias": true,
|
22 |
+
"phm_c_init": "normal",
|
23 |
+
"phm_dim": 4,
|
24 |
+
"phm_init_range": 0.0001,
|
25 |
+
"phm_layer": false,
|
26 |
+
"phm_rank": 1,
|
27 |
+
"reduction_factor": 16,
|
28 |
+
"residual_before_ln": true,
|
29 |
+
"scaling": 1.0,
|
30 |
+
"shared_W_phm": false,
|
31 |
+
"shared_phm_rule": true,
|
32 |
+
"use_gating": false
|
33 |
+
},
|
34 |
+
"config_id": "9ed5b5a29de19b71",
|
35 |
+
"hidden_size": 768,
|
36 |
+
"model_class": "BertModelWithHeads",
|
37 |
+
"model_name": "CAMeL-Lab/bert-base-arabic-camelbert-msa",
|
38 |
+
"model_type": "bert",
|
39 |
+
"name": "mlm",
|
40 |
+
"version": "3.2.1"
|
41 |
+
}
|
mlm/head_config.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"config": {
|
3 |
+
"activation_function": "gelu",
|
4 |
+
"bias": true,
|
5 |
+
"embedding_size": 768,
|
6 |
+
"head_type": "masked_lm",
|
7 |
+
"label2id": null,
|
8 |
+
"layer_norm": true,
|
9 |
+
"layers": 2,
|
10 |
+
"shift_labels": false,
|
11 |
+
"vocab_size": 30000
|
12 |
+
},
|
13 |
+
"hidden_size": 768,
|
14 |
+
"model_class": "BertModelWithHeads",
|
15 |
+
"model_name": "CAMeL-Lab/bert-base-arabic-camelbert-msa",
|
16 |
+
"model_type": "bert",
|
17 |
+
"name": "mlm",
|
18 |
+
"version": "3.2.1"
|
19 |
+
}
|
mlm/pytorch_adapter.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fe7e729c4de1953e7784cabb44a321fd0f2a8cfe4b11182cef5d2d7ed12a430
|
3 |
+
size 4781837
|
mlm/pytorch_model_head.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:faa9818390df8e5b73959629c1d63d9f131b7c8d996380be3fed6a455194b344
|
3 |
+
size 94650799
|
runs/Aug04_16-39-09_e296e91d98be/events.out.tfevents.1691167167.e296e91d98be.457.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bab686ea3fdbabba26e18d08f700b5a604630d4b4621fc95b2b905bc2133094
|
3 |
+
size 19993
|
runs/Aug04_16-39-09_e296e91d98be/events.out.tfevents.1691169630.e296e91d98be.457.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2928760e649a4fceeaadb10a1a61bb0ec8d6b4c792e8aeed51633b7ac3a5ee3
|
3 |
+
size 1032
|
test_results.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"test_accuracy": 0.8740399385560675,
|
3 |
+
"test_f1": 0.8740399385560675,
|
4 |
+
"test_loss": 0.3366047143936157,
|
5 |
+
"test_precision": 0.8740399385560675,
|
6 |
+
"test_recall": 0.8740399385560675,
|
7 |
+
"test_runtime": 18.1593,
|
8 |
+
"test_samples_per_second": 143.397,
|
9 |
+
"test_steps_per_second": 4.516
|
10 |
+
}
|
train_results.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 20.0,
|
3 |
+
"total_flos": 8766240604668522.0,
|
4 |
+
"train_loss": 0.276022268061368,
|
5 |
+
"train_runtime": 2445.9034,
|
6 |
+
"train_samples_per_second": 69.185,
|
7 |
+
"train_steps_per_second": 2.167
|
8 |
+
}
|