luismsgomes
committed on
Commit
•
472e467
1
Parent(s):
e0129ad
added model
Browse files- 1_Pooling/config.json +10 -0
- config.json +38 -0
- config_sentence_transformers.json +9 -0
- eval/Information-Retrieval_evaluation_mmarco-pt-dev-small_results-lr1e-5-aborted.csv +5 -0
- eval/Information-Retrieval_evaluation_mmarco-pt-dev-small_results.csv +105 -0
- eval/similarity_evaluation_assin-ptbr-test_results.csv +2 -0
- eval/similarity_evaluation_assin-ptpt-test_results.csv +2 -0
- eval/similarity_evaluation_assin2-test_results.csv +2 -0
- eval/similarity_evaluation_iris-sts-test_results.csv +2 -0
- eval/similarity_evaluation_stsb-multi-mt-pt-test_results.csv +2 -0
- model.safetensors +3 -0
- modules.json +14 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +65 -0
- train-config.yaml +27 -0
1_Pooling/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 1536,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": true,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
7 |
+
"pooling_mode_weightedmean_tokens": false,
|
8 |
+
"pooling_mode_lasttoken": false,
|
9 |
+
"include_prompt": true
|
10 |
+
}
|
config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "models/albertina-900m-ptpt-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1",
|
3 |
+
"architectures": [
|
4 |
+
"DebertaV2Model"
|
5 |
+
],
|
6 |
+
"attention_head_size": 64,
|
7 |
+
"attention_probs_dropout_prob": 0.1,
|
8 |
+
"conv_act": "gelu",
|
9 |
+
"conv_kernel_size": 3,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 1536,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 6144,
|
15 |
+
"layer_norm_eps": 1e-07,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"max_relative_positions": -1,
|
18 |
+
"model_type": "deberta-v2",
|
19 |
+
"norm_rel_ebd": "layer_norm",
|
20 |
+
"num_attention_heads": 24,
|
21 |
+
"num_hidden_layers": 24,
|
22 |
+
"pad_token_id": 0,
|
23 |
+
"pooler_dropout": 0,
|
24 |
+
"pooler_hidden_act": "gelu",
|
25 |
+
"pooler_hidden_size": 1536,
|
26 |
+
"pos_att_type": [
|
27 |
+
"p2c",
|
28 |
+
"c2p"
|
29 |
+
],
|
30 |
+
"position_biased_input": false,
|
31 |
+
"position_buckets": 256,
|
32 |
+
"relative_attention": true,
|
33 |
+
"share_att_key": true,
|
34 |
+
"torch_dtype": "float32",
|
35 |
+
"transformers_version": "4.39.3",
|
36 |
+
"type_vocab_size": 0,
|
37 |
+
"vocab_size": 128100
|
38 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"__version__": {
|
3 |
+
"sentence_transformers": "2.6.1",
|
4 |
+
"transformers": "4.39.3",
|
5 |
+
"pytorch": "2.2.2+cu121"
|
6 |
+
},
|
7 |
+
"prompts": {},
|
8 |
+
"default_prompt_name": null
|
9 |
+
}
|
eval/Information-Retrieval_evaluation_mmarco-pt-dev-small_results-lr1e-5-aborted.csv
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
|
2 |
+
0,19891,0.686676217765043,0.8027220630372492,0.8436962750716333,0.8879656160458452,0.09349570200573067,0.8817932187201527,0.7539734843316493,0.7822745078094078,0.7520719215136676
|
3 |
+
0,39782,0.707163323782235,0.8234957020057306,0.8601719197707737,0.9034383954154728,0.09531518624641833,0.8979942693409743,0.773240323827715,0.8007244999086974,0.7707729438411337
|
4 |
+
0,59673,0.6977077363896849,0.8157593123209169,0.85,0.8959885386819484,0.09457020057306591,0.8900191021967526,0.7641103265566007,0.791865440041029,0.7621812413953645
|
5 |
+
0,79564,0.6906876790830946,0.8055873925501432,0.8449856733524356,0.8896848137535817,0.09388252148997135,0.8844555873925501,0.7570755446400139,0.7849885879700434,0.7547763453574594
|
eval/Information-Retrieval_evaluation_mmarco-pt-dev-small_results.csv
ADDED
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
|
2 |
+
0,19891,0.686676217765043,0.8027220630372492,0.8436962750716333,0.8879656160458452,0.09349570200573067,0.8817932187201527,0.7539734843316493,0.7822745078094078,0.7520719215136676
|
3 |
+
0,39782,0.707163323782235,0.8234957020057306,0.8601719197707737,0.9034383954154728,0.09531518624641833,0.8979942693409743,0.773240323827715,0.8007244999086974,0.7707729438411337
|
4 |
+
0,59673,0.6977077363896849,0.8157593123209169,0.85,0.8959885386819484,0.09457020057306591,0.8900191021967526,0.7641103265566007,0.791865440041029,0.7621812413953645
|
5 |
+
0,79564,0.6906876790830946,0.8055873925501432,0.8449856733524356,0.8896848137535817,0.09388252148997135,0.8844555873925501,0.7570755446400139,0.7849885879700434,0.7547763453574594
|
6 |
+
0,19891,0.6203438395415473,0.7439828080229226,0.7902578796561605,0.8436962750716333,0.08862464183381087,0.8363538681948424,0.6929668667849183,0.7242632677331385,0.690875095984185
|
7 |
+
0,39782,0.6730659025787966,0.7873925501432665,0.8293696275071634,0.8749283667621777,0.09210601719197709,0.8690186246418338,0.7394724155182603,0.7677009562148118,0.7371429499973232
|
8 |
+
0,59673,0.6916905444126075,0.8064469914040114,0.8464183381088826,0.8922636103151862,0.09404011461318051,0.8864016236867239,0.75852907399827,0.7866005017081468,0.7561253194426015
|
9 |
+
0,79564,0.7014326647564469,0.8187679083094556,0.8588825214899714,0.8995702005730659,0.09487106017191978,0.8937917860553963,0.7689602947196058,0.7965738949679296,0.7667968975863902
|
10 |
+
0,99455,0.7124641833810889,0.8318051575931232,0.8664756446991404,0.9078796561604584,0.09577363896848137,0.9023877745940784,0.7790101537272012,0.8062758951064879,0.7765478728499272
|
11 |
+
0,119346,0.716189111747851,0.829512893982808,0.8681948424068768,0.9110315186246418,0.09610315186246418,0.9056232091690545,0.7810983194614973,0.808454180896248,0.7783428813795646
|
12 |
+
0,139237,0.7213467048710601,0.832378223495702,0.873352435530086,0.9136103151862465,0.09637535816618911,0.9081781279847183,0.786252956292354,0.8129255351206011,0.7833076165773594
|
13 |
+
0,159128,0.7253581661891118,0.836676217765043,0.8760744985673352,0.9169054441260746,0.09681948424068768,0.9118314231136581,0.7902542979942679,0.8169299183353848,0.787340364829885
|
14 |
+
0,179019,0.7227793696275072,0.8402578796561605,0.8802292263610315,0.9183381088825215,0.09694842406876791,0.9131685768863418,0.7897997111929753,0.8169561483732921,0.7868466464392998
|
15 |
+
0,198910,0.7297994269340974,0.8432664756446991,0.8796561604584527,0.9191977077363896,0.09694842406876791,0.9136938872970392,0.7942150475280828,0.8203711441203599,0.7912636213800311
|
16 |
+
0,218801,0.7316618911174785,0.8446991404011461,0.8810888252148997,0.921919770773639,0.09723495702005731,0.916404011461318,0.7968953245099366,0.8230238693718747,0.793668054221326
|
17 |
+
0,238692,0.733810888252149,0.8487106017191977,0.8863896848137536,0.9226361031518625,0.09732091690544412,0.9170248328557784,0.7989986696684385,0.8250668816110137,0.7963136676589505
|
18 |
+
0,258583,0.7376790830945559,0.8452722063037249,0.8843839541547278,0.9224928366762177,0.09733524355300861,0.9173113658070677,0.8003599854459444,0.8258782670364493,0.7971645207195726
|
19 |
+
0,278474,0.7411174785100286,0.85,0.8861031518624641,0.920487106017192,0.0971919770773639,0.9155324737344793,0.8032153658980298,0.8279345366913405,0.8007657861121821
|
20 |
+
0,298365,0.7428366762177651,0.851432664756447,0.8891117478510029,0.9243553008595988,0.09763610315186247,0.9193887297039159,0.8047995406376481,0.8297863156828637,0.8015892660342179
|
21 |
+
0,318256,0.7431232091690544,0.8502865329512894,0.88810888252149,0.9234957020057306,0.09755014326647565,0.9187082139446036,0.8045313139582466,0.8296123253332633,0.8017689424775438
|
22 |
+
0,338147,0.7438395415472779,0.8518624641833811,0.8905444126074499,0.9246418338108883,0.0977220630372493,0.9201170009551098,0.8059463546641182,0.8312719746670211,0.8035526961638525
|
23 |
+
0,358038,0.7441260744985674,0.8511461318051576,0.8875358166189111,0.9260744985673353,0.09785100286532951,0.9215974212034383,0.8060013871833343,0.8315254961496272,0.8033696446117365
|
24 |
+
0,377929,0.7491404011461318,0.854727793696275,0.8898280802292263,0.9289398280802292,0.0981948424068768,0.9247492836676218,0.8100722586073585,0.8352357065940328,0.8071837419424122
|
25 |
+
0,397820,0.7468481375358166,0.8545845272206304,0.8914040114613181,0.9285100286532951,0.09800859598853869,0.9234240687679083,0.8089239095829345,0.8340204237662775,0.8059615270024146
|
26 |
+
0,417711,0.751432664756447,0.8557306590257879,0.8926934097421203,0.9306590257879657,0.09822349570200575,0.9255969436485196,0.81199413289671,0.8366639352346111,0.8086662376925663
|
27 |
+
0,437602,0.7505730659025788,0.8574498567335244,0.8939828080229226,0.9300859598853868,0.09828080229226362,0.9255969436485195,0.811524764633645,0.8365442932209558,0.8084316428570375
|
28 |
+
0,457493,0.7547277936962751,0.8617478510028653,0.8944126074498567,0.9283667621776505,0.09803724928366761,0.9234360076408786,0.8146785032064389,0.8383824118847123,0.8116012333573631
|
29 |
+
0,477384,0.7520057306590258,0.857593123209169,0.8914040114613181,0.9305157593123209,0.09825214899713468,0.9258834765998089,0.8127441215263547,0.8375475606248511,0.8098212233216132
|
30 |
+
0,497275,0.7548710601719197,0.8611747851002866,0.8965616045845273,0.9320916905444127,0.0984813753581662,0.9273280802292264,0.8149478669213608,0.8395852047610595,0.8118555082662375
|
31 |
+
0,517166,0.7564469914040115,0.8624641833810889,0.895272206303725,0.9310888252148997,0.09840974212034385,0.926313276026743,0.8171256310547123,0.8412180264058458,0.814434164277915
|
32 |
+
0,537057,0.7563037249283667,0.863323782234957,0.8948424068767908,0.9328080229226361,0.098567335243553,0.928235434574976,0.816596909537452,0.8410890925958876,0.8135340349753447
|
33 |
+
0,556948,0.7571633237822349,0.8627507163323782,0.8964183381088825,0.9320916905444127,0.09852435530085961,0.927351957975167,0.8172349001682796,0.8413873387215821,0.8139932771288845
|
34 |
+
0,576839,0.7577363896848137,0.8626074498567335,0.8987106017191977,0.9303724928366762,0.09825214899713466,0.9254775549188158,0.8170838449993163,0.8408493553992008,0.8142303304448247
|
35 |
+
0,596730,0.7574498567335244,0.8597421203438396,0.8936962750716332,0.9315186246418338,0.09842406876790831,0.9266595033428845,0.8166365352253592,0.8407340804997021,0.8136104839168087
|
36 |
+
0,616621,0.7527220630372493,0.8601719197707737,0.8955587392550143,0.9330945558739255,0.09862464183381091,0.9288443170964662,0.8142032792104411,0.839487726548661,0.8112331145550177
|
37 |
+
0,636512,0.7548710601719197,0.8628939828080229,0.8962750716332378,0.9316618911174785,0.0984813753581662,0.9273638968481376,0.8157000727702715,0.840459593632374,0.8130267687665712
|
38 |
+
0,656403,0.7530085959885386,0.86189111747851,0.8957020057306591,0.9318051575931232,0.09840974212034385,0.9271967526265521,0.8143774730522552,0.8393212188562222,0.8115597819776212
|
39 |
+
0,676294,0.7591690544412607,0.8637535816618911,0.8974212034383954,0.9328080229226361,0.09846704871060173,0.9276623686723974,0.8186200368399494,0.8425963126004824,0.8158499793675448
|
40 |
+
0,696185,0.760458452722063,0.8651862464183381,0.8972779369627507,0.9332378223495702,0.09855300859598855,0.9287368672397325,0.8194560422067562,0.8434678522608476,0.8166719966795604
|
41 |
+
0,716076,0.7610315186246418,0.8628939828080229,0.8984240687679083,0.933810888252149,0.09865329512893985,0.9293218720152818,0.8195302337745008,0.8435721964468267,0.8165069472897686
|
42 |
+
0,735967,0.7594555873925501,0.8641833810888252,0.8968481375358166,0.9328080229226361,0.09853868194842406,0.9280085959885387,0.818944546777639,0.8428762552542166,0.8160852725950872
|
43 |
+
0,755858,0.7637535816618911,0.8654727793696275,0.8977077363896848,0.9332378223495702,0.09858166189111749,0.9287010506208215,0.8221433119570637,0.8455171640505106,0.8193100126894071
|
44 |
+
0,775749,0.7636103151862464,0.8657593123209169,0.8992836676217765,0.9342406876790831,0.0987535816618911,0.929691977077364,0.8216715559194049,0.8453755885717837,0.8188015635589823
|
45 |
+
0,795640,0.7627507163323782,0.866189111747851,0.9005730659025788,0.9336676217765043,0.09869627507163325,0.9293218720152818,0.8217884431709619,0.8453657739099143,0.8188042568245371
|
46 |
+
0,815531,0.7617478510028654,0.8677650429799427,0.9027220630372493,0.9355300859598854,0.09886819484240689,0.9310530085959885,0.8212019033974606,0.8455616898981982,0.8185511599404696
|
47 |
+
0,835422,0.7573065902578796,0.8611747851002866,0.8939828080229226,0.9282234957020057,0.09813753581661891,0.9238896848137536,0.8162890571701445,0.8399374256074439,0.8136899264786653
|
48 |
+
0,855313,0.7613180515759312,0.8614613180515759,0.8964183381088825,0.9326647564469914,0.09862464183381091,0.9285339063992359,0.8194945877109187,0.8433579606167781,0.8164370026194898
|
49 |
+
0,875204,0.7627507163323782,0.867621776504298,0.9012893982808023,0.9361031518624642,0.0988681948424069,0.9313872970391596,0.8227310456178634,0.846536869481785,0.8196750619235467
|
50 |
+
0,895095,0.7644699140401147,0.8648997134670487,0.8982808022922636,0.9349570200573066,0.09872492836676218,0.9304083094555874,0.822390730886431,0.846068686667549,0.8195144421878694
|
51 |
+
0,914986,0.7667621776504298,0.8681948424068768,0.9024355300859599,0.9376790830945558,0.09902578796561605,0.932712511938873,0.824962648383133,0.8484268157102385,0.8216009228170417
|
52 |
+
0,934877,0.7636103151862464,0.8714899713467049,0.9038681948424069,0.9363896848137536,0.09881088825214901,0.9313037249283668,0.8240158957565823,0.8474386082202197,0.8207057654570817
|
53 |
+
0,954768,0.7603151862464184,0.8646131805157593,0.9002865329512894,0.9351002865329513,0.09873925501432665,0.9301337153772683,0.8198284213398804,0.8440687951404998,0.8168797132766971
|
54 |
+
0,974659,0.7611747851002866,0.8686246418338109,0.9053008595988539,0.9356733524355301,0.09879656160458451,0.9306112702960841,0.8219180652203549,0.8457710123153714,0.8188228813051177
|
55 |
+
0,994550,0.7630372492836677,0.8707736389684814,0.9041547277936963,0.9365329512893983,0.09892550143266475,0.9318290353390639,0.8236135557374801,0.847425578209692,0.8206357426133198
|
56 |
+
0,1014441,0.7640401146131806,0.8683381088825215,0.9021489971346704,0.9340974212034384,0.0986676217765043,0.9293218720152817,0.8229491858825646,0.8461883936044302,0.8198774676030318
|
57 |
+
0,1034332,0.7656160458452722,0.867621776504298,0.9020057306590258,0.9353868194842407,0.09892550143266475,0.9312917860553963,0.8236413562559681,0.8472093720791207,0.8204986925626111
|
58 |
+
0,1054223,0.7706303724928367,0.87378223495702,0.9038681948424069,0.9369627507163324,0.09908309455587394,0.9327363896848138,0.828341122026651,0.851058695445996,0.8251213463981715
|
59 |
+
0,1074114,0.7634670487106017,0.8679083094555874,0.9041547277936963,0.935243553008596,0.0988681948424069,0.9308500477554918,0.8226698731068336,0.8465031619947313,0.8197783762774588
|
60 |
+
0,1094005,0.7669054441260745,0.8681948424068768,0.9041547277936963,0.938538681948424,0.09915472779369627,0.933751193887297,0.8252372993132273,0.8488669236180225,0.821920283092166
|
61 |
+
0,1113896,0.7702005730659026,0.873352435530086,0.9081661891117478,0.9376790830945558,0.09921203438395415,0.9333452722063037,0.8276602651566808,0.8508699824856587,0.8246975999698329
|
62 |
+
0,1133787,0.7707736389684814,0.8743553008595989,0.9064469914040114,0.9391117478510028,0.0993409742120344,0.9351361031518625,0.8290096420612159,0.8522788214796762,0.825930900142743
|
63 |
+
0,1153678,0.7664756446991404,0.873352435530086,0.9064469914040114,0.9381088825214899,0.0991404011461318,0.9337392550143266,0.8258741529085335,0.8494891976962177,0.8226592239377765
|
64 |
+
0,1173569,0.7713467048710602,0.8739255014326648,0.9063037249283667,0.938538681948424,0.09916905444126076,0.9340138490926456,0.8292850889161757,0.8520524930539365,0.8259190516755253
|
65 |
+
0,1193460,0.7700573065902578,0.8732091690544412,0.9073065902578796,0.9388252148997135,0.09925501432664757,0.9344675262655205,0.8284495952153518,0.8516703868868762,0.825306547278246
|
66 |
+
0,1213351,0.7700573065902578,0.8730659025787966,0.9060171919770774,0.9379656160458453,0.0991547277936963,0.9337392550143266,0.8284010437986061,0.851447867370514,0.8252460583266904
|
67 |
+
0,1233242,0.7722063037249284,0.8736389684813753,0.9067335243553009,0.9409742120343839,0.09945558739255014,0.9364732569245463,0.8303959157684063,0.8536711396164638,0.8272642227433656
|
68 |
+
0,1253133,0.7717765042979943,0.8719197707736389,0.9067335243553009,0.9402578796561605,0.09939828080229228,0.935947946513849,0.8294898690135057,0.8529469292257653,0.8266551661663469
|
69 |
+
0,1273024,0.7744985673352436,0.87378223495702,0.9088825214899714,0.9402578796561605,0.0993839541547278,0.9359360076408787,0.8312328307636304,0.8543235454585494,0.828475184534567
|
70 |
+
0,1292915,0.7753581661891118,0.8753581661891118,0.908595988538682,0.9402578796561605,0.0993266475644699,0.9355659025787966,0.8317630304270692,0.8546205711558493,0.8290615205923493
|
71 |
+
0,1312806,0.7746418338108882,0.8726361031518625,0.9100286532951289,0.9409742120343839,0.09939828080229228,0.9362941738299904,0.8311668258516377,0.8543081575293895,0.8283336040566576
|
72 |
+
0,1332697,0.775214899713467,0.8749283667621777,0.91189111747851,0.9408309455587393,0.09939828080229225,0.9360792741165234,0.8323945968072022,0.8552681582188931,0.8295149681200018
|
73 |
+
0,1352588,0.7760744985673352,0.8739255014326648,0.908595988538682,0.9418338108882521,0.0994842406876791,0.9371060171919771,0.8323562787101447,0.8553683999686118,0.8293713776889325
|
74 |
+
0,1372479,0.776647564469914,0.8744985673352436,0.9078796561604584,0.9404011461318051,0.0993409742120344,0.9356972301814708,0.8326717492154432,0.8554406628376127,0.8300293879287444
|
75 |
+
0,1392370,0.7744985673352436,0.8756446991404011,0.9103151862464184,0.9416905444126075,0.09945558739255014,0.9367956064947468,0.8319579751671419,0.8549263192487353,0.8288275743683852
|
76 |
+
0,1412261,0.7756446991404011,0.8757879656160459,0.9113180515759313,0.9411174785100287,0.09945558739255014,0.936461318051576,0.8325704962022992,0.8553151443337574,0.8294184977967456
|
77 |
+
0,1432152,0.7740687679083095,0.8734957020057307,0.9126074498567335,0.9424068767908309,0.09959885386819485,0.9378820439350525,0.8319171555919392,0.8552445716695324,0.8287457496980525
|
78 |
+
0,1452043,0.7749283667621777,0.8740687679083095,0.9090257879656161,0.9418338108882521,0.09945558739255014,0.9370224450811843,0.8315162368672383,0.854622057690668,0.8283387293683632
|
79 |
+
0,1471934,0.7750716332378224,0.87621776504298,0.91189111747851,0.9424068767908309,0.0995272206303725,0.9375477554918816,0.8326703847728187,0.8555256674062209,0.8291733176637109
|
80 |
+
0,1491825,0.7742120343839541,0.8740687679083095,0.9097421203438395,0.9415472779369628,0.0994842406876791,0.9369627507163324,0.8311805271296654,0.8543956470819455,0.8281056214377067
|
81 |
+
0,1511716,0.7746418338108882,0.8763610315186247,0.9117478510028654,0.941404011461318,0.0994269340974212,0.9365448901623687,0.8328521967526253,0.8554236484578596,0.8295219194188891
|
82 |
+
0,1531607,0.7736389684813754,0.8749283667621777,0.9108882521489972,0.9421203438395416,0.09955587392550144,0.9376193887297039,0.8315020807750021,0.8549447847288599,0.8286020252915053
|
83 |
+
0,1551498,0.7776504297994269,0.8744985673352436,0.9113180515759313,0.9411174785100287,0.09941260744985675,0.9364255014326648,0.8334837631327591,0.856192361238807,0.830719626832759
|
84 |
+
0,1571389,0.7757879656160458,0.8769340974212034,0.9101719197707736,0.9386819484240687,0.0991977077363897,0.9340974212034384,0.8325849934051928,0.8550142023560136,0.8300529006496287
|
85 |
+
0,1591280,0.7805157593123209,0.8782234957020058,0.9120343839541547,0.9398280802292264,0.09931232091690545,0.935339063992359,0.8357005275844805,0.8575849122572756,0.8330167537506131
|
86 |
+
0,1611171,0.7785100286532951,0.8782234957020058,0.9130372492836676,0.9404011461318051,0.0993839541547278,0.9358882521489972,0.8350823782234937,0.857361797001159,0.8324701802654975
|
87 |
+
0,1631062,0.7785100286532951,0.8785100286532951,0.9100286532951289,0.939971346704871,0.0993839541547278,0.9356614135625596,0.8344279005776131,0.8566506905100588,0.8316185292573617
|
88 |
+
0,1650953,0.7769340974212035,0.8773638968481375,0.9083094555873925,0.9393982808022923,0.0992836676217765,0.9351480420248328,0.8332967776413313,0.8557103453779058,0.8305997893634542
|
89 |
+
0,1670844,0.7759312320916906,0.8782234957020058,0.9095988538681948,0.9409742120343839,0.09945558739255014,0.9364135625596943,0.8332391299404175,0.8559392810292845,0.8303656974621793
|
90 |
+
0,1690735,0.7760744985673352,0.8785100286532951,0.9108882521489972,0.9412607449856734,0.09946991404011461,0.9366523400191021,0.8334693796334179,0.8560226066838483,0.8302847647142915
|
91 |
+
0,1710626,0.7777936962750717,0.8793696275071633,0.9120343839541547,0.9411174785100287,0.09946991404011461,0.9364851957975167,0.8347105676081299,0.8571109691587206,0.8318828784556608
|
92 |
+
0,1730517,0.7793696275071633,0.8795128939828081,0.9117478510028654,0.9421203438395416,0.0995702005730659,0.9375596943648519,0.8359242393232356,0.858251679822224,0.8330393221207893
|
93 |
+
0,1750408,0.7765042979942693,0.8792263610315186,0.9116045845272206,0.9419770773638968,0.09954154727793697,0.9375835721107927,0.8343801450857306,0.8572086014264069,0.8316938164592865
|
94 |
+
0,1770299,0.7808022922636103,0.8795128939828081,0.9111747851002865,0.9424068767908309,0.09958452722063038,0.9378462273161413,0.8370010119616123,0.8591335773119384,0.8341050781528395
|
95 |
+
0,1790190,0.7786532951289399,0.8800859598853868,0.9114613180515759,0.9422636103151862,0.09954154727793697,0.9375716332378223,0.8358997362077571,0.8582436476355945,0.8330240087507138
|
96 |
+
0,1810081,0.7826647564469914,0.8806590257879656,0.9117478510028654,0.9432664756446991,0.09964183381088826,0.9385744985673352,0.838352719788965,0.8602248514056844,0.8352773976334323
|
97 |
+
0,1829972,0.7812320916905444,0.8802292263610315,0.9116045845272206,0.9429799426934098,0.09961318051575932,0.9382521489971347,0.8371784463546624,0.8595013094329498,0.8345531451415473
|
98 |
+
0,1849863,0.7813753581661891,0.8799426934097421,0.9121776504297995,0.9432664756446991,0.09965616045845273,0.9386103151862464,0.8374647518988471,0.8597746404234234,0.8347362041438514
|
99 |
+
0,1869754,0.7812320916905444,0.8793696275071633,0.9111747851002865,0.9434097421203438,0.09968481375358167,0.9388252148997135,0.8371134079228629,0.8595104394781836,0.8343265402530841
|
100 |
+
0,1889645,0.7800859598853869,0.8795128939828081,0.9116045845272206,0.9429799426934098,0.09964183381088826,0.9383954154727794,0.8365225474143798,0.8590669700463994,0.8339347345588674
|
101 |
+
0,1909536,0.7802292263610315,0.8797994269340974,0.9124641833810888,0.9426934097421203,0.09964183381088826,0.9383476599808978,0.8368026561149761,0.8592814029496454,0.8341963523889172
|
102 |
+
0,1929427,0.7803724928366762,0.8795128939828081,0.9121776504297995,0.9421203438395416,0.0995702005730659,0.9376074498567335,0.8368038500022731,0.8590343964053853,0.8341177984987821
|
103 |
+
0,1949318,0.7799426934097421,0.8787965616045845,0.9120343839541547,0.9422636103151862,0.0995702005730659,0.9376790830945558,0.8365484718242585,0.8588402816144871,0.8338396581430574
|
104 |
+
0,1969209,0.7803724928366762,0.879083094555874,0.91189111747851,0.9426934097421203,0.09962750716332379,0.9381805157593123,0.8369040796834483,0.8592423094188277,0.8341833420017519
|
105 |
+
0,-1,0.7803724928366762,0.8792263610315186,0.9121776504297995,0.9429799426934098,0.09964183381088826,0.9383954154727794,0.8369651384909255,0.8593301327978569,0.834216619802917
|
eval/similarity_evaluation_assin-ptbr-test_results.csv
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
|
2 |
+
-1,-1,0.747952229525418,0.7389185074643115,0.7664688149997081,0.7451763920752217,0.7663714125110497,0.7448613669883203,0.6926662911193622,0.679171949634377
|
eval/similarity_evaluation_assin-ptpt-test_results.csv
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
|
2 |
+
-1,-1,0.7513773337811402,0.7560695337787583,0.7695326843113053,0.7571855518591687,0.7690356354169847,0.7567781765660634,0.7033434479345515,0.7012318192432161
|
eval/similarity_evaluation_assin2-test_results.csv
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
|
2 |
+
-1,-1,0.8101696141720081,0.748927138087568,0.7834599801877342,0.7380892542494936,0.7832049594625379,0.7379402565975568,0.7842993628977963,0.70714470616414
|
eval/similarity_evaluation_iris-sts-test_results.csv
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
|
2 |
+
-1,-1,0.7895231664158904,0.7847394112710312,0.7673844666417402,0.7689592688421604,0.7678979617213967,0.770274053807498,0.7810706078118825,0.7831173637402492
|
eval/similarity_evaluation_stsb-multi-mt-pt-test_results.csv
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
|
2 |
+
-1,-1,0.836985262455597,0.826866882475686,0.8241037932727239,0.8214984273617987,0.8236820326347707,0.8210951099457946,0.7951527627824947,0.7806583497866606
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd550d317aa8736324695cc1949201676e5b05f9ee41f088920053642c93ef68
|
3 |
+
size 3538419000
|
modules.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
}
|
14 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 128,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "[CLS]",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"cls_token": {
|
10 |
+
"content": "[CLS]",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"eos_token": {
|
17 |
+
"content": "[SEP]",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"mask_token": {
|
24 |
+
"content": "[MASK]",
|
25 |
+
"lstrip": false,
|
26 |
+
"normalized": false,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
},
|
30 |
+
"pad_token": {
|
31 |
+
"content": "[PAD]",
|
32 |
+
"lstrip": false,
|
33 |
+
"normalized": false,
|
34 |
+
"rstrip": false,
|
35 |
+
"single_word": false
|
36 |
+
},
|
37 |
+
"sep_token": {
|
38 |
+
"content": "[SEP]",
|
39 |
+
"lstrip": false,
|
40 |
+
"normalized": false,
|
41 |
+
"rstrip": false,
|
42 |
+
"single_word": false
|
43 |
+
},
|
44 |
+
"unk_token": {
|
45 |
+
"content": "[UNK]",
|
46 |
+
"lstrip": false,
|
47 |
+
"normalized": false,
|
48 |
+
"rstrip": false,
|
49 |
+
"single_word": false
|
50 |
+
}
|
51 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,65 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "[CLS]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "[SEP]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "[UNK]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"128000": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"bos_token": "[CLS]",
|
45 |
+
"clean_up_tokenization_spaces": true,
|
46 |
+
"cls_token": "[CLS]",
|
47 |
+
"do_lower_case": false,
|
48 |
+
"eos_token": "[SEP]",
|
49 |
+
"mask_token": "[MASK]",
|
50 |
+
"max_length": 128,
|
51 |
+
"model_max_length": 512,
|
52 |
+
"pad_to_multiple_of": null,
|
53 |
+
"pad_token": "[PAD]",
|
54 |
+
"pad_token_type_id": 0,
|
55 |
+
"padding_side": "right",
|
56 |
+
"sep_token": "[SEP]",
|
57 |
+
"sp_model_kwargs": {},
|
58 |
+
"split_by_punct": false,
|
59 |
+
"stride": 0,
|
60 |
+
"tokenizer_class": "DebertaV2Tokenizer",
|
61 |
+
"truncation_side": "right",
|
62 |
+
"truncation_strategy": "longest_first",
|
63 |
+
"unk_token": "[UNK]",
|
64 |
+
"vocab_type": "spm"
|
65 |
+
}
|
train-config.yaml
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
trainer: "gist"
|
2 |
+
model_name: "albertina-900m-ptpt-mmarco-pairs-gist1-v1"
|
3 |
+
base_model_name: "albertina-900m-ptpt-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"
|
4 |
+
guide_model_name: "bertimbau-100m-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"
|
5 |
+
validation_ir: True
|
6 |
+
validation_ir_corpus_size: 50000
|
7 |
+
# validation_ir_corpus_size: 500
|
8 |
+
|
9 |
+
# see https://huggingface.co/docs/datasets/v2.18.0/en/about_dataset_load
|
10 |
+
train_dataset_configs:
|
11 |
+
- alias: "mmarco"
|
12 |
+
path: "unicamp-dl/mmarco"
|
13 |
+
name: "portuguese"
|
14 |
+
split: "train"
|
15 |
+
# split: "train[1000:2000]"
|
16 |
+
|
17 |
+
examples_are_triples: False
|
18 |
+
examples_are_labelled: False
|
19 |
+
seed: 1
|
20 |
+
learning_rate: 1e-6
|
21 |
+
warmup_ratio: 0.1
|
22 |
+
weight_decay: 0.01
|
23 |
+
batch_size: 40
|
24 |
+
use_amp: True
|
25 |
+
epochs: 1
|
26 |
+
# validations_per_epoch: 1
|
27 |
+
validations_per_epoch: 100
|