Ubuntu
committed on
Commit
•
0b44937
1
Parent(s):
4292dec
added ST model
Browse files- 0_Transformer/added_tokens.json +1 -0
- 0_Transformer/config.json +27 -0
- 0_Transformer/pytorch_model.bin +3 -0
- 0_Transformer/sentence_bert_config.json +4 -0
- 0_Transformer/sentencepiece.bpe.model +3 -0
- 0_Transformer/special_tokens_map.json +1 -0
- 0_Transformer/tokenizer_config.json +1 -0
- 1_Pooling/config.json +7 -0
- config.json +3 -0
- modules.json +14 -0
- similarity_evaluation_sts-dev_results.csv +5 -0
- similarity_evaluation_sts-test_results.csv +2 -0
0_Transformer/added_tokens.json
ADDED
@@ -0,0 +1 @@
|
|
|
1 |
+
{"IDancienthistoryID": 250002, "IDhomerunID": 250033, "IDweddingdayID": 250061, "IDinsurancecompanyID": 250034, "IDswansongID": 250056, "IDprivateeyeID": 250047, "IDflowerchildID": 250028, "IDmailinglistID": 250038, "IDchainreactionID": 250012, "IDpillowslipID": 250046, "IDcallcentreID": 250010, "IDelbowroomID": 250025, "IDgooseeggID": 250030, "IDbusybeeID": 250009, "IDsittingduckID": 250053, "IDduststormID": 250022, "IDtopdogID": 250058, "IDphonebookID": 250045, "IDcottoncandyID": 250017, "IDpandacarID": 250043, "IDlifevestID": 250036, "IDhighlifeID": 250032, "IDeagerbeaverID": 250023, "IDthinktankID": 250057, "IDsacredcowID": 250050, "IDhealthcheckID": 250031, "IDweddinganniversaryID": 250060, "IDdrylandID": 250021, "IDfishstoryID": 250027, "IDbadappleID": 250003, "IDloansharkID": 250037, "IDpeaceconferenceID": 250044, "IDmailserviceID": 250039, "IDentrancehallID": 250026, "IDskintoneID": 250054, "IDclosedbookID": 250013, "IDcomputerprogramID": 250014, "IDconartistID": 250015, "IDbirthrateID": 250007, "IDcookingstoveID": 250016, "IDcellularphoneID": 250011, "IDlabourunionID": 250035, "IDricepaperID": 250049, "IDmentaldisorderID": 250040, "IDnarrowescapeID": 250042, "IDmiddleschoolID": 250041, "IDsugardaddyID": 250055, "IDfoodmarketID": 250029, "IDbowtieID": 250008, "IDdreamticketID": 250020, "IDbigfishID": 250006, "IDpublicserviceID": 250048, "IDbananarepublicID": 250005, "IDsilverliningID": 250052, "IDbadhatID": 250004, "IDsexbombID": 250051, "IDcriticalreviewID": 250018, "IDeconomicaidID": 250024, "IDtravelguideID": 250059, "IDdisabilityinsuranceID": 250019}
|
0_Transformer/config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/home/ubuntu/tmp/",
|
3 |
+
"architectures": [
|
4 |
+
"XLMRobertaModel"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"gradient_checkpointing": false,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 768,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 3072,
|
15 |
+
"layer_norm_eps": 1e-05,
|
16 |
+
"max_position_embeddings": 514,
|
17 |
+
"model_type": "xlm-roberta",
|
18 |
+
"num_attention_heads": 12,
|
19 |
+
"num_hidden_layers": 12,
|
20 |
+
"output_past": true,
|
21 |
+
"pad_token_id": 1,
|
22 |
+
"position_embedding_type": "absolute",
|
23 |
+
"transformers_version": "4.5.1",
|
24 |
+
"type_vocab_size": 1,
|
25 |
+
"use_cache": true,
|
26 |
+
"vocab_size": 250062
|
27 |
+
}
|
0_Transformer/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a7089fe53bbe57db8acce94e381e9ab1504b276f02e850e9f03e2e325a6706b
|
3 |
+
size 1112445495
|
0_Transformer/sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": null,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
0_Transformer/sentencepiece.bpe.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
|
3 |
+
size 5069051
|
0_Transformer/special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
1 |
+
{"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true}}
|
0_Transformer/tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
1 |
+
{"bos_token": "<s>", "eos_token": "</s>", "sep_token": "</s>", "cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "truncation": true, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "/home/ubuntu/tmp/"}
|
1_Pooling/config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 768,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": true,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false
|
7 |
+
}
|
config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"__version__": "1.1.0"
|
3 |
+
}
|
modules.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "0_Transformer",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
}
|
14 |
+
]
|
similarity_evaluation_sts-dev_results.csv
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
|
2 |
+
0,-1,0.8068453666185014,0.8091793146510394,0.8048708512868359,0.8057732251118485,0.8150273883865529,0.8157099871427879,0.7523952010509299,0.7503425605240357
|
3 |
+
1,-1,0.8326340331606166,0.8349558021905582,0.8278354008865084,0.8283915841373897,0.8344265880843423,0.835056022900291,0.7813159592427814,0.7834231047055855
|
4 |
+
2,-1,0.8531377765618325,0.855079059850075,0.8422047783688726,0.8452438573331594,0.8480692234057359,0.8506436244047921,0.8252254219803428,0.8269980547059492
|
5 |
+
3,-1,0.8538679921765833,0.855391230884013,0.843583765135863,0.8471519768407193,0.8485321279546,0.8511623525207791,0.8265153502799939,0.8278091798208754
|
similarity_evaluation_sts-test_results.csv
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
1 |
+
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
|
2 |
+
-1,-1,0.8281024548375999,0.8235372139268156,0.8200413882187241,0.8147515000551068,0.8250539828729784,0.8184865551389828,0.7843721996955079,0.7736275040320477
|