luismsgomes committed on
Commit
472e467
1 Parent(s): e0129ad

added model

Browse files
1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 1536,
3
+ "pooling_mode_cls_token": false,
4
+ "pooling_mode_mean_tokens": true,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "models/albertina-900m-ptpt-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1",
3
+ "architectures": [
4
+ "DebertaV2Model"
5
+ ],
6
+ "attention_head_size": 64,
7
+ "attention_probs_dropout_prob": 0.1,
8
+ "conv_act": "gelu",
9
+ "conv_kernel_size": 3,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1536,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 6144,
15
+ "layer_norm_eps": 1e-07,
16
+ "max_position_embeddings": 512,
17
+ "max_relative_positions": -1,
18
+ "model_type": "deberta-v2",
19
+ "norm_rel_ebd": "layer_norm",
20
+ "num_attention_heads": 24,
21
+ "num_hidden_layers": 24,
22
+ "pad_token_id": 0,
23
+ "pooler_dropout": 0,
24
+ "pooler_hidden_act": "gelu",
25
+ "pooler_hidden_size": 1536,
26
+ "pos_att_type": [
27
+ "p2c",
28
+ "c2p"
29
+ ],
30
+ "position_biased_input": false,
31
+ "position_buckets": 256,
32
+ "relative_attention": true,
33
+ "share_att_key": true,
34
+ "torch_dtype": "float32",
35
+ "transformers_version": "4.39.3",
36
+ "type_vocab_size": 0,
37
+ "vocab_size": 128100
38
+ }
config_sentence_transformers.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "__version__": {
3
+ "sentence_transformers": "2.6.1",
4
+ "transformers": "4.39.3",
5
+ "pytorch": "2.2.2+cu121"
6
+ },
7
+ "prompts": {},
8
+ "default_prompt_name": null
9
+ }
eval/Information-Retrieval_evaluation_mmarco-pt-dev-small_results-lr1e-5-aborted.csv ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
2
+ 0,19891,0.686676217765043,0.8027220630372492,0.8436962750716333,0.8879656160458452,0.09349570200573067,0.8817932187201527,0.7539734843316493,0.7822745078094078,0.7520719215136676
3
+ 0,39782,0.707163323782235,0.8234957020057306,0.8601719197707737,0.9034383954154728,0.09531518624641833,0.8979942693409743,0.773240323827715,0.8007244999086974,0.7707729438411337
4
+ 0,59673,0.6977077363896849,0.8157593123209169,0.85,0.8959885386819484,0.09457020057306591,0.8900191021967526,0.7641103265566007,0.791865440041029,0.7621812413953645
5
+ 0,79564,0.6906876790830946,0.8055873925501432,0.8449856733524356,0.8896848137535817,0.09388252148997135,0.8844555873925501,0.7570755446400139,0.7849885879700434,0.7547763453574594
eval/Information-Retrieval_evaluation_mmarco-pt-dev-small_results.csv ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
2
+ 0,19891,0.686676217765043,0.8027220630372492,0.8436962750716333,0.8879656160458452,0.09349570200573067,0.8817932187201527,0.7539734843316493,0.7822745078094078,0.7520719215136676
3
+ 0,39782,0.707163323782235,0.8234957020057306,0.8601719197707737,0.9034383954154728,0.09531518624641833,0.8979942693409743,0.773240323827715,0.8007244999086974,0.7707729438411337
4
+ 0,59673,0.6977077363896849,0.8157593123209169,0.85,0.8959885386819484,0.09457020057306591,0.8900191021967526,0.7641103265566007,0.791865440041029,0.7621812413953645
5
+ 0,79564,0.6906876790830946,0.8055873925501432,0.8449856733524356,0.8896848137535817,0.09388252148997135,0.8844555873925501,0.7570755446400139,0.7849885879700434,0.7547763453574594
6
+ 0,19891,0.6203438395415473,0.7439828080229226,0.7902578796561605,0.8436962750716333,0.08862464183381087,0.8363538681948424,0.6929668667849183,0.7242632677331385,0.690875095984185
7
+ 0,39782,0.6730659025787966,0.7873925501432665,0.8293696275071634,0.8749283667621777,0.09210601719197709,0.8690186246418338,0.7394724155182603,0.7677009562148118,0.7371429499973232
8
+ 0,59673,0.6916905444126075,0.8064469914040114,0.8464183381088826,0.8922636103151862,0.09404011461318051,0.8864016236867239,0.75852907399827,0.7866005017081468,0.7561253194426015
9
+ 0,79564,0.7014326647564469,0.8187679083094556,0.8588825214899714,0.8995702005730659,0.09487106017191978,0.8937917860553963,0.7689602947196058,0.7965738949679296,0.7667968975863902
10
+ 0,99455,0.7124641833810889,0.8318051575931232,0.8664756446991404,0.9078796561604584,0.09577363896848137,0.9023877745940784,0.7790101537272012,0.8062758951064879,0.7765478728499272
11
+ 0,119346,0.716189111747851,0.829512893982808,0.8681948424068768,0.9110315186246418,0.09610315186246418,0.9056232091690545,0.7810983194614973,0.808454180896248,0.7783428813795646
12
+ 0,139237,0.7213467048710601,0.832378223495702,0.873352435530086,0.9136103151862465,0.09637535816618911,0.9081781279847183,0.786252956292354,0.8129255351206011,0.7833076165773594
13
+ 0,159128,0.7253581661891118,0.836676217765043,0.8760744985673352,0.9169054441260746,0.09681948424068768,0.9118314231136581,0.7902542979942679,0.8169299183353848,0.787340364829885
14
+ 0,179019,0.7227793696275072,0.8402578796561605,0.8802292263610315,0.9183381088825215,0.09694842406876791,0.9131685768863418,0.7897997111929753,0.8169561483732921,0.7868466464392998
15
+ 0,198910,0.7297994269340974,0.8432664756446991,0.8796561604584527,0.9191977077363896,0.09694842406876791,0.9136938872970392,0.7942150475280828,0.8203711441203599,0.7912636213800311
16
+ 0,218801,0.7316618911174785,0.8446991404011461,0.8810888252148997,0.921919770773639,0.09723495702005731,0.916404011461318,0.7968953245099366,0.8230238693718747,0.793668054221326
17
+ 0,238692,0.733810888252149,0.8487106017191977,0.8863896848137536,0.9226361031518625,0.09732091690544412,0.9170248328557784,0.7989986696684385,0.8250668816110137,0.7963136676589505
18
+ 0,258583,0.7376790830945559,0.8452722063037249,0.8843839541547278,0.9224928366762177,0.09733524355300861,0.9173113658070677,0.8003599854459444,0.8258782670364493,0.7971645207195726
19
+ 0,278474,0.7411174785100286,0.85,0.8861031518624641,0.920487106017192,0.0971919770773639,0.9155324737344793,0.8032153658980298,0.8279345366913405,0.8007657861121821
20
+ 0,298365,0.7428366762177651,0.851432664756447,0.8891117478510029,0.9243553008595988,0.09763610315186247,0.9193887297039159,0.8047995406376481,0.8297863156828637,0.8015892660342179
21
+ 0,318256,0.7431232091690544,0.8502865329512894,0.88810888252149,0.9234957020057306,0.09755014326647565,0.9187082139446036,0.8045313139582466,0.8296123253332633,0.8017689424775438
22
+ 0,338147,0.7438395415472779,0.8518624641833811,0.8905444126074499,0.9246418338108883,0.0977220630372493,0.9201170009551098,0.8059463546641182,0.8312719746670211,0.8035526961638525
23
+ 0,358038,0.7441260744985674,0.8511461318051576,0.8875358166189111,0.9260744985673353,0.09785100286532951,0.9215974212034383,0.8060013871833343,0.8315254961496272,0.8033696446117365
24
+ 0,377929,0.7491404011461318,0.854727793696275,0.8898280802292263,0.9289398280802292,0.0981948424068768,0.9247492836676218,0.8100722586073585,0.8352357065940328,0.8071837419424122
25
+ 0,397820,0.7468481375358166,0.8545845272206304,0.8914040114613181,0.9285100286532951,0.09800859598853869,0.9234240687679083,0.8089239095829345,0.8340204237662775,0.8059615270024146
26
+ 0,417711,0.751432664756447,0.8557306590257879,0.8926934097421203,0.9306590257879657,0.09822349570200575,0.9255969436485196,0.81199413289671,0.8366639352346111,0.8086662376925663
27
+ 0,437602,0.7505730659025788,0.8574498567335244,0.8939828080229226,0.9300859598853868,0.09828080229226362,0.9255969436485195,0.811524764633645,0.8365442932209558,0.8084316428570375
28
+ 0,457493,0.7547277936962751,0.8617478510028653,0.8944126074498567,0.9283667621776505,0.09803724928366761,0.9234360076408786,0.8146785032064389,0.8383824118847123,0.8116012333573631
29
+ 0,477384,0.7520057306590258,0.857593123209169,0.8914040114613181,0.9305157593123209,0.09825214899713468,0.9258834765998089,0.8127441215263547,0.8375475606248511,0.8098212233216132
30
+ 0,497275,0.7548710601719197,0.8611747851002866,0.8965616045845273,0.9320916905444127,0.0984813753581662,0.9273280802292264,0.8149478669213608,0.8395852047610595,0.8118555082662375
31
+ 0,517166,0.7564469914040115,0.8624641833810889,0.895272206303725,0.9310888252148997,0.09840974212034385,0.926313276026743,0.8171256310547123,0.8412180264058458,0.814434164277915
32
+ 0,537057,0.7563037249283667,0.863323782234957,0.8948424068767908,0.9328080229226361,0.098567335243553,0.928235434574976,0.816596909537452,0.8410890925958876,0.8135340349753447
33
+ 0,556948,0.7571633237822349,0.8627507163323782,0.8964183381088825,0.9320916905444127,0.09852435530085961,0.927351957975167,0.8172349001682796,0.8413873387215821,0.8139932771288845
34
+ 0,576839,0.7577363896848137,0.8626074498567335,0.8987106017191977,0.9303724928366762,0.09825214899713466,0.9254775549188158,0.8170838449993163,0.8408493553992008,0.8142303304448247
35
+ 0,596730,0.7574498567335244,0.8597421203438396,0.8936962750716332,0.9315186246418338,0.09842406876790831,0.9266595033428845,0.8166365352253592,0.8407340804997021,0.8136104839168087
36
+ 0,616621,0.7527220630372493,0.8601719197707737,0.8955587392550143,0.9330945558739255,0.09862464183381091,0.9288443170964662,0.8142032792104411,0.839487726548661,0.8112331145550177
37
+ 0,636512,0.7548710601719197,0.8628939828080229,0.8962750716332378,0.9316618911174785,0.0984813753581662,0.9273638968481376,0.8157000727702715,0.840459593632374,0.8130267687665712
38
+ 0,656403,0.7530085959885386,0.86189111747851,0.8957020057306591,0.9318051575931232,0.09840974212034385,0.9271967526265521,0.8143774730522552,0.8393212188562222,0.8115597819776212
39
+ 0,676294,0.7591690544412607,0.8637535816618911,0.8974212034383954,0.9328080229226361,0.09846704871060173,0.9276623686723974,0.8186200368399494,0.8425963126004824,0.8158499793675448
40
+ 0,696185,0.760458452722063,0.8651862464183381,0.8972779369627507,0.9332378223495702,0.09855300859598855,0.9287368672397325,0.8194560422067562,0.8434678522608476,0.8166719966795604
41
+ 0,716076,0.7610315186246418,0.8628939828080229,0.8984240687679083,0.933810888252149,0.09865329512893985,0.9293218720152818,0.8195302337745008,0.8435721964468267,0.8165069472897686
42
+ 0,735967,0.7594555873925501,0.8641833810888252,0.8968481375358166,0.9328080229226361,0.09853868194842406,0.9280085959885387,0.818944546777639,0.8428762552542166,0.8160852725950872
43
+ 0,755858,0.7637535816618911,0.8654727793696275,0.8977077363896848,0.9332378223495702,0.09858166189111749,0.9287010506208215,0.8221433119570637,0.8455171640505106,0.8193100126894071
44
+ 0,775749,0.7636103151862464,0.8657593123209169,0.8992836676217765,0.9342406876790831,0.0987535816618911,0.929691977077364,0.8216715559194049,0.8453755885717837,0.8188015635589823
45
+ 0,795640,0.7627507163323782,0.866189111747851,0.9005730659025788,0.9336676217765043,0.09869627507163325,0.9293218720152818,0.8217884431709619,0.8453657739099143,0.8188042568245371
46
+ 0,815531,0.7617478510028654,0.8677650429799427,0.9027220630372493,0.9355300859598854,0.09886819484240689,0.9310530085959885,0.8212019033974606,0.8455616898981982,0.8185511599404696
47
+ 0,835422,0.7573065902578796,0.8611747851002866,0.8939828080229226,0.9282234957020057,0.09813753581661891,0.9238896848137536,0.8162890571701445,0.8399374256074439,0.8136899264786653
48
+ 0,855313,0.7613180515759312,0.8614613180515759,0.8964183381088825,0.9326647564469914,0.09862464183381091,0.9285339063992359,0.8194945877109187,0.8433579606167781,0.8164370026194898
49
+ 0,875204,0.7627507163323782,0.867621776504298,0.9012893982808023,0.9361031518624642,0.0988681948424069,0.9313872970391596,0.8227310456178634,0.846536869481785,0.8196750619235467
50
+ 0,895095,0.7644699140401147,0.8648997134670487,0.8982808022922636,0.9349570200573066,0.09872492836676218,0.9304083094555874,0.822390730886431,0.846068686667549,0.8195144421878694
51
+ 0,914986,0.7667621776504298,0.8681948424068768,0.9024355300859599,0.9376790830945558,0.09902578796561605,0.932712511938873,0.824962648383133,0.8484268157102385,0.8216009228170417
52
+ 0,934877,0.7636103151862464,0.8714899713467049,0.9038681948424069,0.9363896848137536,0.09881088825214901,0.9313037249283668,0.8240158957565823,0.8474386082202197,0.8207057654570817
53
+ 0,954768,0.7603151862464184,0.8646131805157593,0.9002865329512894,0.9351002865329513,0.09873925501432665,0.9301337153772683,0.8198284213398804,0.8440687951404998,0.8168797132766971
54
+ 0,974659,0.7611747851002866,0.8686246418338109,0.9053008595988539,0.9356733524355301,0.09879656160458451,0.9306112702960841,0.8219180652203549,0.8457710123153714,0.8188228813051177
55
+ 0,994550,0.7630372492836677,0.8707736389684814,0.9041547277936963,0.9365329512893983,0.09892550143266475,0.9318290353390639,0.8236135557374801,0.847425578209692,0.8206357426133198
56
+ 0,1014441,0.7640401146131806,0.8683381088825215,0.9021489971346704,0.9340974212034384,0.0986676217765043,0.9293218720152817,0.8229491858825646,0.8461883936044302,0.8198774676030318
57
+ 0,1034332,0.7656160458452722,0.867621776504298,0.9020057306590258,0.9353868194842407,0.09892550143266475,0.9312917860553963,0.8236413562559681,0.8472093720791207,0.8204986925626111
58
+ 0,1054223,0.7706303724928367,0.87378223495702,0.9038681948424069,0.9369627507163324,0.09908309455587394,0.9327363896848138,0.828341122026651,0.851058695445996,0.8251213463981715
59
+ 0,1074114,0.7634670487106017,0.8679083094555874,0.9041547277936963,0.935243553008596,0.0988681948424069,0.9308500477554918,0.8226698731068336,0.8465031619947313,0.8197783762774588
60
+ 0,1094005,0.7669054441260745,0.8681948424068768,0.9041547277936963,0.938538681948424,0.09915472779369627,0.933751193887297,0.8252372993132273,0.8488669236180225,0.821920283092166
61
+ 0,1113896,0.7702005730659026,0.873352435530086,0.9081661891117478,0.9376790830945558,0.09921203438395415,0.9333452722063037,0.8276602651566808,0.8508699824856587,0.8246975999698329
62
+ 0,1133787,0.7707736389684814,0.8743553008595989,0.9064469914040114,0.9391117478510028,0.0993409742120344,0.9351361031518625,0.8290096420612159,0.8522788214796762,0.825930900142743
63
+ 0,1153678,0.7664756446991404,0.873352435530086,0.9064469914040114,0.9381088825214899,0.0991404011461318,0.9337392550143266,0.8258741529085335,0.8494891976962177,0.8226592239377765
64
+ 0,1173569,0.7713467048710602,0.8739255014326648,0.9063037249283667,0.938538681948424,0.09916905444126076,0.9340138490926456,0.8292850889161757,0.8520524930539365,0.8259190516755253
65
+ 0,1193460,0.7700573065902578,0.8732091690544412,0.9073065902578796,0.9388252148997135,0.09925501432664757,0.9344675262655205,0.8284495952153518,0.8516703868868762,0.825306547278246
66
+ 0,1213351,0.7700573065902578,0.8730659025787966,0.9060171919770774,0.9379656160458453,0.0991547277936963,0.9337392550143266,0.8284010437986061,0.851447867370514,0.8252460583266904
67
+ 0,1233242,0.7722063037249284,0.8736389684813753,0.9067335243553009,0.9409742120343839,0.09945558739255014,0.9364732569245463,0.8303959157684063,0.8536711396164638,0.8272642227433656
68
+ 0,1253133,0.7717765042979943,0.8719197707736389,0.9067335243553009,0.9402578796561605,0.09939828080229228,0.935947946513849,0.8294898690135057,0.8529469292257653,0.8266551661663469
69
+ 0,1273024,0.7744985673352436,0.87378223495702,0.9088825214899714,0.9402578796561605,0.0993839541547278,0.9359360076408787,0.8312328307636304,0.8543235454585494,0.828475184534567
70
+ 0,1292915,0.7753581661891118,0.8753581661891118,0.908595988538682,0.9402578796561605,0.0993266475644699,0.9355659025787966,0.8317630304270692,0.8546205711558493,0.8290615205923493
71
+ 0,1312806,0.7746418338108882,0.8726361031518625,0.9100286532951289,0.9409742120343839,0.09939828080229228,0.9362941738299904,0.8311668258516377,0.8543081575293895,0.8283336040566576
72
+ 0,1332697,0.775214899713467,0.8749283667621777,0.91189111747851,0.9408309455587393,0.09939828080229225,0.9360792741165234,0.8323945968072022,0.8552681582188931,0.8295149681200018
73
+ 0,1352588,0.7760744985673352,0.8739255014326648,0.908595988538682,0.9418338108882521,0.0994842406876791,0.9371060171919771,0.8323562787101447,0.8553683999686118,0.8293713776889325
74
+ 0,1372479,0.776647564469914,0.8744985673352436,0.9078796561604584,0.9404011461318051,0.0993409742120344,0.9356972301814708,0.8326717492154432,0.8554406628376127,0.8300293879287444
75
+ 0,1392370,0.7744985673352436,0.8756446991404011,0.9103151862464184,0.9416905444126075,0.09945558739255014,0.9367956064947468,0.8319579751671419,0.8549263192487353,0.8288275743683852
76
+ 0,1412261,0.7756446991404011,0.8757879656160459,0.9113180515759313,0.9411174785100287,0.09945558739255014,0.936461318051576,0.8325704962022992,0.8553151443337574,0.8294184977967456
77
+ 0,1432152,0.7740687679083095,0.8734957020057307,0.9126074498567335,0.9424068767908309,0.09959885386819485,0.9378820439350525,0.8319171555919392,0.8552445716695324,0.8287457496980525
78
+ 0,1452043,0.7749283667621777,0.8740687679083095,0.9090257879656161,0.9418338108882521,0.09945558739255014,0.9370224450811843,0.8315162368672383,0.854622057690668,0.8283387293683632
79
+ 0,1471934,0.7750716332378224,0.87621776504298,0.91189111747851,0.9424068767908309,0.0995272206303725,0.9375477554918816,0.8326703847728187,0.8555256674062209,0.8291733176637109
80
+ 0,1491825,0.7742120343839541,0.8740687679083095,0.9097421203438395,0.9415472779369628,0.0994842406876791,0.9369627507163324,0.8311805271296654,0.8543956470819455,0.8281056214377067
81
+ 0,1511716,0.7746418338108882,0.8763610315186247,0.9117478510028654,0.941404011461318,0.0994269340974212,0.9365448901623687,0.8328521967526253,0.8554236484578596,0.8295219194188891
82
+ 0,1531607,0.7736389684813754,0.8749283667621777,0.9108882521489972,0.9421203438395416,0.09955587392550144,0.9376193887297039,0.8315020807750021,0.8549447847288599,0.8286020252915053
83
+ 0,1551498,0.7776504297994269,0.8744985673352436,0.9113180515759313,0.9411174785100287,0.09941260744985675,0.9364255014326648,0.8334837631327591,0.856192361238807,0.830719626832759
84
+ 0,1571389,0.7757879656160458,0.8769340974212034,0.9101719197707736,0.9386819484240687,0.0991977077363897,0.9340974212034384,0.8325849934051928,0.8550142023560136,0.8300529006496287
85
+ 0,1591280,0.7805157593123209,0.8782234957020058,0.9120343839541547,0.9398280802292264,0.09931232091690545,0.935339063992359,0.8357005275844805,0.8575849122572756,0.8330167537506131
86
+ 0,1611171,0.7785100286532951,0.8782234957020058,0.9130372492836676,0.9404011461318051,0.0993839541547278,0.9358882521489972,0.8350823782234937,0.857361797001159,0.8324701802654975
87
+ 0,1631062,0.7785100286532951,0.8785100286532951,0.9100286532951289,0.939971346704871,0.0993839541547278,0.9356614135625596,0.8344279005776131,0.8566506905100588,0.8316185292573617
88
+ 0,1650953,0.7769340974212035,0.8773638968481375,0.9083094555873925,0.9393982808022923,0.0992836676217765,0.9351480420248328,0.8332967776413313,0.8557103453779058,0.8305997893634542
89
+ 0,1670844,0.7759312320916906,0.8782234957020058,0.9095988538681948,0.9409742120343839,0.09945558739255014,0.9364135625596943,0.8332391299404175,0.8559392810292845,0.8303656974621793
90
+ 0,1690735,0.7760744985673352,0.8785100286532951,0.9108882521489972,0.9412607449856734,0.09946991404011461,0.9366523400191021,0.8334693796334179,0.8560226066838483,0.8302847647142915
91
+ 0,1710626,0.7777936962750717,0.8793696275071633,0.9120343839541547,0.9411174785100287,0.09946991404011461,0.9364851957975167,0.8347105676081299,0.8571109691587206,0.8318828784556608
92
+ 0,1730517,0.7793696275071633,0.8795128939828081,0.9117478510028654,0.9421203438395416,0.0995702005730659,0.9375596943648519,0.8359242393232356,0.858251679822224,0.8330393221207893
93
+ 0,1750408,0.7765042979942693,0.8792263610315186,0.9116045845272206,0.9419770773638968,0.09954154727793697,0.9375835721107927,0.8343801450857306,0.8572086014264069,0.8316938164592865
94
+ 0,1770299,0.7808022922636103,0.8795128939828081,0.9111747851002865,0.9424068767908309,0.09958452722063038,0.9378462273161413,0.8370010119616123,0.8591335773119384,0.8341050781528395
95
+ 0,1790190,0.7786532951289399,0.8800859598853868,0.9114613180515759,0.9422636103151862,0.09954154727793697,0.9375716332378223,0.8358997362077571,0.8582436476355945,0.8330240087507138
96
+ 0,1810081,0.7826647564469914,0.8806590257879656,0.9117478510028654,0.9432664756446991,0.09964183381088826,0.9385744985673352,0.838352719788965,0.8602248514056844,0.8352773976334323
97
+ 0,1829972,0.7812320916905444,0.8802292263610315,0.9116045845272206,0.9429799426934098,0.09961318051575932,0.9382521489971347,0.8371784463546624,0.8595013094329498,0.8345531451415473
98
+ 0,1849863,0.7813753581661891,0.8799426934097421,0.9121776504297995,0.9432664756446991,0.09965616045845273,0.9386103151862464,0.8374647518988471,0.8597746404234234,0.8347362041438514
99
+ 0,1869754,0.7812320916905444,0.8793696275071633,0.9111747851002865,0.9434097421203438,0.09968481375358167,0.9388252148997135,0.8371134079228629,0.8595104394781836,0.8343265402530841
100
+ 0,1889645,0.7800859598853869,0.8795128939828081,0.9116045845272206,0.9429799426934098,0.09964183381088826,0.9383954154727794,0.8365225474143798,0.8590669700463994,0.8339347345588674
101
+ 0,1909536,0.7802292263610315,0.8797994269340974,0.9124641833810888,0.9426934097421203,0.09964183381088826,0.9383476599808978,0.8368026561149761,0.8592814029496454,0.8341963523889172
102
+ 0,1929427,0.7803724928366762,0.8795128939828081,0.9121776504297995,0.9421203438395416,0.0995702005730659,0.9376074498567335,0.8368038500022731,0.8590343964053853,0.8341177984987821
103
+ 0,1949318,0.7799426934097421,0.8787965616045845,0.9120343839541547,0.9422636103151862,0.0995702005730659,0.9376790830945558,0.8365484718242585,0.8588402816144871,0.8338396581430574
104
+ 0,1969209,0.7803724928366762,0.879083094555874,0.91189111747851,0.9426934097421203,0.09962750716332379,0.9381805157593123,0.8369040796834483,0.8592423094188277,0.8341833420017519
105
+ 0,-1,0.7803724928366762,0.8792263610315186,0.9121776504297995,0.9429799426934098,0.09964183381088826,0.9383954154727794,0.8369651384909255,0.8593301327978569,0.834216619802917
eval/similarity_evaluation_assin-ptbr-test_results.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
2
+ -1,-1,0.747952229525418,0.7389185074643115,0.7664688149997081,0.7451763920752217,0.7663714125110497,0.7448613669883203,0.6926662911193622,0.679171949634377
eval/similarity_evaluation_assin-ptpt-test_results.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
2
+ -1,-1,0.7513773337811402,0.7560695337787583,0.7695326843113053,0.7571855518591687,0.7690356354169847,0.7567781765660634,0.7033434479345515,0.7012318192432161
eval/similarity_evaluation_assin2-test_results.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
2
+ -1,-1,0.8101696141720081,0.748927138087568,0.7834599801877342,0.7380892542494936,0.7832049594625379,0.7379402565975568,0.7842993628977963,0.70714470616414
eval/similarity_evaluation_iris-sts-test_results.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
2
+ -1,-1,0.7895231664158904,0.7847394112710312,0.7673844666417402,0.7689592688421604,0.7678979617213967,0.770274053807498,0.7810706078118825,0.7831173637402492
eval/similarity_evaluation_stsb-multi-mt-pt-test_results.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
2
+ -1,-1,0.836985262455597,0.826866882475686,0.8241037932727239,0.8214984273617987,0.8236820326347707,0.8210951099457946,0.7951527627824947,0.7806583497866606
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd550d317aa8736324695cc1949201676e5b05f9ee41f088920053642c93ef68
3
+ size 3538419000
modules.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ }
14
+ ]
sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 128,
3
+ "do_lower_case": false
4
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "[CLS]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "[SEP]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "[MASK]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "[PAD]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "[SEP]",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "[UNK]",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "[CLS]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "[SEP]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "[UNK]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "128000": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "bos_token": "[CLS]",
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "[CLS]",
47
+ "do_lower_case": false,
48
+ "eos_token": "[SEP]",
49
+ "mask_token": "[MASK]",
50
+ "max_length": 128,
51
+ "model_max_length": 512,
52
+ "pad_to_multiple_of": null,
53
+ "pad_token": "[PAD]",
54
+ "pad_token_type_id": 0,
55
+ "padding_side": "right",
56
+ "sep_token": "[SEP]",
57
+ "sp_model_kwargs": {},
58
+ "split_by_punct": false,
59
+ "stride": 0,
60
+ "tokenizer_class": "DebertaV2Tokenizer",
61
+ "truncation_side": "right",
62
+ "truncation_strategy": "longest_first",
63
+ "unk_token": "[UNK]",
64
+ "vocab_type": "spm"
65
+ }
train-config.yaml ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ trainer: "gist"
2
+ model_name: "albertina-900m-ptpt-mmarco-pairs-gist1-v1"
3
+ base_model_name: "albertina-900m-ptpt-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"
4
+ guide_model_name: "bertimbau-100m-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"
5
+ validation_ir: True
6
+ validation_ir_corpus_size: 50000
7
+ # validation_ir_corpus_size: 500
8
+
9
+ # see https://huggingface.co/docs/datasets/v2.18.0/en/about_dataset_load
10
+ train_dataset_configs:
11
+ - alias: "mmarco"
12
+ path: "unicamp-dl/mmarco"
13
+ name: "portuguese"
14
+ split: "train"
15
+ # split: "train[1000:2000]"
16
+
17
+ examples_are_triples: False
18
+ examples_are_labelled: False
19
+ seed: 1
20
+ learning_rate: 1e-6
21
+ warmup_ratio: 0.1
22
+ weight_decay: 0.01
23
+ batch_size: 40
24
+ use_amp: True
25
+ epochs: 1
26
+ # validations_per_epoch: 1
27
+ validations_per_epoch: 100