diff --git "a/results.json" "b/results.json" --- "a/results.json" +++ "b/results.json" @@ -1,4 +1,123 @@ [ + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.1920266076 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4391810036 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1921503062 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4121866696 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.0706883182 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.2475181808 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.1707669328 + }, { "model":"amazon\/nova-micro-v1", "bcp_47":"am", @@ -125,6 +244,41 @@ "metric":"chrf", "score":0.5463705477 }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.0629352571 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.3681064162 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.0907131082 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.345867578 + }, { "model":"amazon\/nova-micro-v1", "bcp_47":"arz", @@ -160,6 +314,76 @@ "metric":"chrf", "score":0.4094860171 }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.178673865 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.421571814 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0893532438 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.322658401 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.2155508388 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.4627157806 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2362014825 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4311272979 + }, { "model":"amazon\/nova-micro-v1", "bcp_47":"az", @@ -195,6 +419,41 @@ "metric":"chrf", "score":0.3827364935 }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.0852543641 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.3968535114 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.1568859483 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.3854296145 + }, { "model":"amazon\/nova-micro-v1", "bcp_47":"bho", @@ -230,6 +489,41 @@ "metric":"chrf", "score":0.3498742372 }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, { "model":"amazon\/nova-micro-v1", "bcp_47":"bn", @@ -279,6 +573,160 @@ "metric":"chrf", "score":0.4502390132 }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.245009056 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.4752285329 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.1249288306 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.4378159282 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.0418701115 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.227562406 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0126447021 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.2329401033 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.1929725876 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.4742897968 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.2142339765 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.4337679078 + }, { "model":"amazon\/nova-micro-v1", "bcp_47":"de", @@ -328,6 +776,55 @@ "metric":"chrf", "score":0.6258445826 }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.2411522305 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.4648713205 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.2526136998 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.4761366058 + }, { "model":"amazon\/nova-micro-v1", "bcp_47":"en", @@ -559,6 +1056,41 @@ "metric":"chrf", "score":0.5963334297 }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0342743018 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2106722499 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0168251159 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.2071693978 + }, { "model":"amazon\/nova-micro-v1", "bcp_47":"gu", @@ -687,46896 +1219,109546 @@ }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"id", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"id", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.1741677254 + "score":0.1740026405 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"id", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.4469342589 + "score":0.4261065659 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"id", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.1716570673 + "score":0.0865662826 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"id", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.5608938423 + "score":0.3708353537 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"it", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.0 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"it", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.2125826846 + "score":0.0 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"it", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.4735941044 + "score":0.0 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"it", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.2872908558 + "score":0.0 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"it", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.5675711887 + "score":0.0 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", + "bcp_47":"hu", "task":"mgsm", "metric":"accuracy", - "score":0.4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.1 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.2197709837 + "score":0.2110505791 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.4784848367 + "score":0.4739587631 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.3426239655 + "score":0.258885113 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.4822747548 + "score":0.4885220189 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", + "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.2192585886 + "score":0.1741677254 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4527368673 + "score":0.4469342589 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1076519805 + "score":0.1716570673 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.4493011434 + "score":0.5608938423 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1691888664 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4411352116 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1416550774 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3528205749 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", + "bcp_47":"ig", + "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.1 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", + "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.3 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.144249324 + "score":0.1185701002 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.4191931285 + "score":0.3493767594 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.2803945229 + "score":0.0477092787 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.3626852212 + "score":0.2820590617 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.2611524911 + "score":0.1533886213 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.4964180281 + "score":0.3781904602 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.1563741006 + "score":0.0407683795 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.4042462159 + "score":0.3408267624 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", + "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.1387332093 + "score":0.2125826846 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.4231622054 + "score":0.4735941044 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.1326285083 + "score":0.2872908558 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.3320956129 + "score":0.5675711887 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ms", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ms", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", "score":0.5 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ms", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2497447823 + "score":0.2197709837 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ms", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5162841499 + "score":0.4784848367 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ms", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.3139021174 + "score":0.3426239655 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ms", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.6108991322 + "score":0.4822747548 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"my", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"my", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.235010453 + "score":0.2192585886 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"my", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4387602841 + "score":0.4527368673 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"my", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.0992435005 + "score":0.1076519805 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"my", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.3897491958 + "score":0.4493011434 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"om", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.0 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", "score":0.0 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"om", - "task":"mmlu", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"kk", + "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"om", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.0253971349 + "score":0.1468838458 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"om", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.1941399108 + "score":0.4417745561 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"om", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.0169773321 + "score":0.1037111406 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"om", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.1905807428 + "score":0.3845090606 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"or", + "bcp_47":"km", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"or", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.1621367612 + "score":0.1705614622 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"or", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.4038308668 + "score":0.4283589307 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"or", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.0908092738 + "score":0.0591946627 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"or", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.3143126503 + "score":0.2932951073 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.3548435009 + "score":0.1691888664 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.6046727327 + "score":0.4411352116 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.3341282505 + "score":0.1416550774 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.4931240563 + "score":0.3528205749 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.1867871917 + "score":0.144249324 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.4539322586 + "score":0.4191931285 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.2742131221 + "score":0.2803945229 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.5129096175 + "score":0.3626852212 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.2534618489 + "score":0.0633143836 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.4757478619 + "score":0.2651687739 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.4150555406 + "score":0.020688049 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.632650236 + "score":0.2307402586 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.173300895 + "score":0.2269784465 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.4267275321 + "score":0.4948809346 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.2934481188 + "score":0.2820214504 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.5432096638 + "score":0.5208833255 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.1924194773 + "score":0.1601088672 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.4198584709 + "score":0.4390231849 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.0594147664 + "score":0.1901773558 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.2791093079 + "score":0.4143082353 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":0.8 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.2 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.203432711 + "score":0.1257791635 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.4661592161 + "score":0.3415200548 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.260138004 + "score":0.0274461195 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5610336232 + "score":0.3265811196 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.1686868634 + "score":0.2611524911 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.4170694333 + "score":0.4964180281 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.1076094956 + "score":0.1563741006 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.4166151764 + "score":0.4042462159 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"te", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mgsm", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.1387332093 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.4231622054 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.1326285083 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.3320956129 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ms", + "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"te", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.5 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"te", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.3031235597 + "score":0.2497447823 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"te", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.537458124 + "score":0.5162841499 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"te", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.3112392832 + "score":0.3139021174 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"te", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.5195600347 + "score":0.6108991322 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"th", + "bcp_47":"my", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.1544266067 + "score":0.235010453 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"th", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.4093583062 + "score":0.4387602841 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"th", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.2921490956 + "score":0.0992435005 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"th", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.4738053288 + "score":0.3897491958 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", + "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", "score":0.4 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.1911760417 + "score":0.216754292 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.4884230434 + "score":0.4725649931 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2744588637 + "score":0.1116933816 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.5473239267 + "score":0.3950140706 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2338522454 + "score":0.2226934995 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.4761317098 + "score":0.4632319399 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.1016530484 + "score":0.2791201051 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.3475324071 + "score":0.5528589826 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"uz", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"uz", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.1532167967 + "score":0.0909296921 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"uz", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.4049784493 + "score":0.2970179383 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"uz", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.1825939096 + "score":0.02807499 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"uz", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.4435726767 + "score":0.219484121 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", + "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.2 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.122224664 + "score":0.0253971349 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.3790772862 + "score":0.1941399108 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.1919159066 + "score":0.0169773321 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.4399907204 + "score":0.1905807428 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"wuu", + "bcp_47":"or", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"wuu", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.1258893867 + "score":0.1621367612 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"wuu", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.3740568466 + "score":0.4038308668 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"wuu", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.1033449919 + "score":0.0908092738 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"wuu", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.1661073339 + "score":0.3143126503 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.1573790422 + "score":0.3548435009 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.438817852 + "score":0.6046727327 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.1346642263 + "score":0.3341282505 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.2288901399 + "score":0.4931240563 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", + "bcp_47":"pl", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.2 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", + "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.1734447333 + "score":0.1867871917 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.4737881775 + "score":0.4539322586 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.2855931625 + "score":0.2742131221 }, { "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.3243323503 + "score":0.5129096175 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"am", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"am", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"am", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2026417516 + "score":0.2534618489 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"am", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.463337874 + "score":0.4757478619 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"am", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.1217867685 + "score":0.4150555406 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"am", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.2662662886 + "score":0.632650236 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"apc", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"apc", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.2523784543 + "score":0.1876189148 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"apc", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5195328715 + "score":0.454947207 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"apc", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.2422451252 + "score":0.3342150948 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"apc", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.5264317244 + "score":0.57049006 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2660357996 + "score":0.173300895 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5489237487 + "score":0.4267275321 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.3431691167 + "score":0.2934481188 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.5659025601 + "score":0.5432096638 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", + "model":"amazon\/nova-micro-v1", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", + "model":"amazon\/nova-micro-v1", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.221843468 + "score":0.0583944161 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", + "model":"amazon\/nova-micro-v1", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.4559655934 + "score":0.3018524463 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", + "model":"amazon\/nova-micro-v1", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.1965127641 + "score":0.0428604601 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", + "model":"amazon\/nova-micro-v1", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.4448745325 + "score":0.2723962004 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"az", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"az", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.1557419708 + "score":0.1924194773 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"az", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.4249908572 + "score":0.4198584709 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"az", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.1551519146 + "score":0.0594147664 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"az", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.4046874828 + "score":0.2791093079 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bho", + "model":"amazon\/nova-micro-v1", + "bcp_47":"si", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bho", + "model":"amazon\/nova-micro-v1", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.2524146198 + "score":0.1888886982 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bho", + "model":"amazon\/nova-micro-v1", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.4953606649 + "score":0.4271659434 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bho", + "model":"amazon\/nova-micro-v1", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.1826604742 + "score":0.0950029931 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bho", + "model":"amazon\/nova-micro-v1", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.3887388562 + "score":0.2956403655 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.2999810338 + "score":0.0476351796 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.5315905896 + "score":0.2242691735 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.3568113924 + "score":0.0203405417 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.5379558638 + "score":0.2850725298 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", + "model":"amazon\/nova-micro-v1", + "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", + "model":"amazon\/nova-micro-v1", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.4 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", + "model":"amazon\/nova-micro-v1", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.3410327538 + "score":0.0944388832 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", + "model":"amazon\/nova-micro-v1", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.5702449417 + "score":0.306261789 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", + "model":"amazon\/nova-micro-v1", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.4621824412 + "score":0.019432628 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", + "model":"amazon\/nova-micro-v1", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.6644677733 + "score":0.2483400713 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mgsm", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sr", + "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2062990967 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.4818899065 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.2783417409 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.4975137727 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"su", + "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.5530727537 + "score":0.1360125442 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.7075859327 + "score":0.3674257568 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.6368037655 + "score":0.0850175921 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.8170495194 + "score":0.3898736967 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3558328881 + "score":0.2441010155 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5816613686 + "score":0.4832568053 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.3018683161 + "score":0.2973906807 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.5862734644 + "score":0.5569302178 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.2520796337 + "score":0.203432711 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5331446204 + "score":0.4661592161 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.1921744404 + "score":0.260138004 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.407787256 + "score":0.5610336232 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.3243217549 + "score":0.1686868634 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5392052945 + "score":0.4170694333 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.3295144102 + "score":0.1076094956 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.5926958618 + "score":0.4166151764 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.1 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.3482763208 + "score":0.3031235597 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5982327963 + "score":0.537458124 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.452269216 + "score":0.3112392832 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6590312745 + "score":0.5195600347 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.2919455567 + "score":0.1315355302 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.5131981959 + "score":0.3725651966 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.1292315656 + "score":0.0631259366 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.4092770954 + "score":0.3114796779 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", + "model":"amazon\/nova-micro-v1", + "bcp_47":"th", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", + "model":"amazon\/nova-micro-v1", + "bcp_47":"th", "task":"mgsm", "metric":"accuracy", - "score":0.4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.2 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", + "model":"amazon\/nova-micro-v1", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.1854918728 + "score":0.1544266067 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", + "model":"amazon\/nova-micro-v1", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.3934600154 + "score":0.4093583062 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", + "model":"amazon\/nova-micro-v1", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.266974078 + "score":0.2921490956 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", + "model":"amazon\/nova-micro-v1", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.5393383261 + "score":0.4738053288 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.3747394322 + "score":0.0376554837 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.6079633657 + "score":0.220689676 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.4420465241 + "score":0.0245374067 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.6372857982 + "score":0.1093782195 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.4 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.3120299438 + "score":0.1911760417 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5421647326 + "score":0.4884230434 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.3139800299 + "score":0.2744588637 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", + "model":"amazon\/nova-micro-v1", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.6305869448 + "score":0.5473239267 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.2726271593 + "score":0.2342560425 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.5135668055 + "score":0.4694733574 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.3420319137 + "score":0.3127145891 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.6095914494 + "score":0.5389265653 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", + "model":"amazon\/nova-micro-v1", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.3 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "model":"amazon\/nova-micro-v1", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0368191769 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", + "model":"amazon\/nova-micro-v1", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1231521557 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0009825493 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.0937946455 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", + "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.2121435327 + "score":0.2338522454 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5165098934 + "score":0.4761317098 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.3965805608 + "score":0.1016530484 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.5197322727 + "score":0.3475324071 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2594796679 + "score":0.1532167967 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.4780086047 + "score":0.4049784493 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.3009966401 + "score":0.1825939096 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", + "model":"amazon\/nova-micro-v1", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.5761529867 + "score":0.4435726767 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2597105982 + "score":0.122224664 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4929733942 + "score":0.3790772862 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.1901313405 + "score":0.1919159066 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.4793446685 + "score":0.4399907204 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.2 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.2650641815 + "score":0.0652970567 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.5151986111 + "score":0.2548173577 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.2220814456 + "score":0.006043152 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.318063422 + "score":0.1774675407 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.3261687004 + "score":0.1258893867 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.5570892069 + "score":0.3740568466 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.3239362726 + "score":0.1033449919 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", + "model":"amazon\/nova-micro-v1", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.5507453743 + "score":0.1661073339 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.2536168105 + "score":0.1178497705 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.5193737639 + "score":0.3273836873 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.2743904396 + "score":0.0233770563 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.4918283752 + "score":0.2536020887 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ms", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ms", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ms", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.2986347511 + "score":0.0573424824 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ms", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.5339411724 + "score":0.2409922496 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ms", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.3783664491 + "score":0.0316163135 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ms", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.6540376697 + "score":0.1841004492 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"my", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"my", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2199531275 + "score":0.1573790422 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"my", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.4736214414 + "score":0.438817852 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"my", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.2571304866 + "score":0.1346642263 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"my", + "model":"amazon\/nova-micro-v1", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.5221658577 + "score":0.2288901399 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"om", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"om", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.1 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"om", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"om", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.0512543236 + "score":0.1734447333 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"om", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.2613232237 + "score":0.4737881775 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"om", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.0260385015 + "score":0.2855931625 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"om", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.3274101513 + "score":0.3243323503 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.271766815 + "score":0.1225580295 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.5041819226 + "score":0.3092331916 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.1870998997 + "score":0.0262808074 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.4329741844 + "score":0.2709457919 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.4307107958 + "score":0.2525776792 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.6547934264 + "score":0.486411661 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.3789232965 + "score":0.1689851292 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.5490387026 + "score":0.4129981246 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"af", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.2715804037 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.5307525116 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.3285527346 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.5692291394 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.3491027097 + "score":0.2332134247 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.5771246685 + "score":0.423589823 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.3737440632 + "score":0.1556181424 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.6547073078 + "score":0.3940970742 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"am", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", "score":1.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.2584319121 + "score":0.3019856242 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.5177022275 + "score":0.5356092631 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.371218137 + "score":0.2493197472 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.5948906549 + "score":0.3683119816 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.2619487807 + "score":0.3299261084 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.4937679545 + "score":0.5833446367 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.2097242522 + "score":0.2557354135 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.4402768379 + "score":0.4932559294 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2583542451 + "score":0.2978564835 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5157482031 + "score":0.5565909038 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3458513734 + "score":0.432503176 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.634706105 + "score":0.6128170494 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.2339300786 + "score":0.2313315741 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.4691042738 + "score":0.4980876242 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.2567323645 + "score":0.1602739474 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.5361849509 + "score":0.4283745115 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.3887890595 + "score":0.2208466475 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.6100201392 + "score":0.4480506021 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.3146346509 + "score":0.2446811676 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.5476489231 + "score":0.4668847579 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"as", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.2554271374 + "score":0.2365169024 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.5059580785 + "score":0.4798564418 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.3635410685 + "score":0.1836576399 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.5132811401 + "score":0.4135133991 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.3173811815 + "score":0.3426000326 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.5742755278 + "score":0.5515631826 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.3658586977 + "score":0.1661968791 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.5886644893 + "score":0.36455729 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"az", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.2324983634 + "score":0.2545049288 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.497221173 + "score":0.4810751728 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.2976387517 + "score":0.1944100883 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.4761547661 + "score":0.4665838917 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.2305488159 + "score":0.2285219894 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.4723700911 + "score":0.494917535 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.2058479152 + "score":0.2797028839 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.4902380763 + "score":0.4981195393 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.3027505857 + "score":0.2674142888 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.5506378818 + "score":0.5117383385 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.3708866541 + "score":0.2226695839 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.5846851624 + "score":0.4175069959 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.2388037754 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.5072972409 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.1136417481 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.1766903691 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", "score":1.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.143983328 + "score":0.3456828806 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.3955437811 + "score":0.5745055104 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.2002778421 + "score":0.3168780466 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.2907084137 + "score":0.5146817021 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.2377253988 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.5405656214 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.2660263348 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.3459946232 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"am", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.2016755199 + "score":0.4102088719 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.4502815524 + "score":0.5919699107 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.1687061726 + "score":0.3905880035 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.2849440478 + "score":0.6171544436 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.2569252635 + "score":0.2819272083 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.5329928091 + "score":0.5597768822 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.2423805131 + "score":0.2855875443 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.5144112629 + "score":0.5213025666 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.2993048546 + "score":0.3459871993 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.5651988199 + "score":0.6001384205 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.3853695566 + "score":0.4616988853 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.602672086 + "score":0.6321620897 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"de", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1819096557 + "score":0.3819883103 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.4374822654 + "score":0.6006708192 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.2316387528 + "score":0.487017155 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.4676592617 + "score":0.6782242157 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"el", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.1950569484 + "score":0.3137128529 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.4560500844 + "score":0.547364909 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.1448904562 + "score":0.3942999119 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.4007813245 + "score":0.5751984516 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bho", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bho", - "task":"translation_from", - "metric":"bleu", - "score":0.2098690628 + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bho", - "task":"translation_from", - "metric":"chrf", - "score":0.4737398201 + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bho", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5715619385 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.715520007 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.1892048942 + "score":0.7318691008 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bho", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.3849575805 + "score":0.8563332446 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2798537803 + "score":0.3643234323 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5394779979 + "score":0.5843649416 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3719179468 + "score":0.3881940897 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.539682577 + "score":0.6134636944 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.3207762021 + "score":0.3166464353 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5555389401 + "score":0.5644297126 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.4227752207 + "score":0.255024921 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.6601015066 + "score":0.4730105151 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.5548034204 + "score":0.3710429385 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.7071106777 + "score":0.6023461066 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.6432470265 + "score":0.3249072169 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.8278285651 + "score":0.6015751183 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3223436235 + "score":0.376865653 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5379000389 + "score":0.6004276916 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.3061941236 + "score":0.528425696 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.5918382188 + "score":0.7187146132 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.3294693656 + "score":0.0388587129 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.5673243159 + "score":0.2391023347 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.1938427279 + "score":0.0240769455 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.4526315895 + "score":0.243334857 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"gu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.3412226864 + "score":0.2822570677 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5602175563 + "score":0.5115986572 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.2910894115 + "score":0.1968109087 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.5672691361 + "score":0.4530952838 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.3297556296 + "score":0.2122035826 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.5925809306 + "score":0.4411039967 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.4619761505 + "score":0.2092794988 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.6734036273 + "score":0.4991915153 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3055790363 + "score":0.4228838058 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.5265498141 + "score":0.640023433 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.1365241949 + "score":0.4313107714 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.4093204393 + "score":0.6419340536 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2742764457 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.5234337918 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1283588392 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3942937124 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ht", + "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.1778454432 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.4028796881 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.2463440773 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.5200026897 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hu", + "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.3412169553 + "score":0.3239027756 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.598919602 + "score":0.5801190353 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.3937102354 + "score":0.3518811457 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.6229439454 + "score":0.5955885461 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"id", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.3020610187 + "score":0.3600825798 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5462026627 + "score":0.6054355131 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.299038365 + "score":0.3725744078 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.625735911 + "score":0.6643987333 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.2270079348 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.4461810563 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1880347324 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.4366454082 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.2896828865 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.5142198212 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.2227918044 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.5195207754 + }, + { + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"it", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"it", "task":"mgsm", "metric":"accuracy", "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.254215081 + "score":0.3487353423 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5128620442 + "score":0.5751528871 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.3318074211 + "score":0.4005498625 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.5973973733 + "score":0.6354726766 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"ja", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"ja", "task":"mgsm", "metric":"accuracy", "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.1875636541 + "score":0.2982872033 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5136106256 + "score":0.5388133219 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.3333377273 + "score":0.3041789231 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.4709407515 + "score":0.4600408983 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.2789250445 + "score":0.3464358022 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.52614288 + "score":0.5558199575 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2580648249 + "score":0.2492331002 }, { - "model":"deepseek\/deepseek-chat-v3-0324", + "model":"anthropic\/claude-3.5-sonnet", "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.574708573 + "score":0.5673549318 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.2431929513 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.4397197217 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.1999599641 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.4781553813 + "score":0.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2497463416 + "score":0.243733181 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.5083726446 + "score":0.5336823494 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.2002123483 + "score":0.3319552288 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.2845065116 + "score":0.5710759927 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"km", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.319035437 + "score":0.3526008915 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.555554753 + "score":0.5987314155 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.2835968152 + "score":0.2114985992 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.5094572017 + "score":0.4380696418 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.2487969868 + "score":0.3225451009 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.518708582 + "score":0.5503588307 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.2238578938 + "score":0.3450200815 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.4748109447 + "score":0.5340229728 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.3058774517 + "score":0.2513328863 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.5603224049 + "score":0.509018423 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.3684068806 + "score":0.3099962758 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.6535736283 + "score":0.3679934022 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"my", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"my", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.2253225205 + "score":0.133543561 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"my", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.4798221167 + "score":0.3430238701 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"my", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.2383027705 + "score":0.0554389677 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"my", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.504994716 + "score":0.3402266285 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"om", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"om", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"om", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.0235872225 + "score":0.3820373565 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"om", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.2475231508 + "score":0.5998907111 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"om", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.0365961569 + "score":0.2728061501 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"om", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.3050512265 + "score":0.4840324931 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.2767258101 + "score":0.295109772 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.514091898 + "score":0.5448597381 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.1796236972 + "score":0.247074884 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4422888692 + "score":0.4883086081 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.3823229705 + "score":0.3323748277 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.6453681393 + "score":0.5590337603 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.3548387061 + "score":0.1910199162 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5492435889 + "score":0.5212112142 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2581682802 + "score":0.3430335831 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5198796684 + "score":0.5746721035 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.2662027737 + "score":0.3481170694 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.540420297 + "score":0.5673214411 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.3091555064 + "score":0.321620887 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5528775735 + "score":0.554989685 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.3860807525 + "score":0.2947526867 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.6710753294 + "score":0.4967353717 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.2464304597 + "score":0.3837477301 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.5343201712 + "score":0.6078820797 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.3592456339 + "score":0.460911653 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.5816925415 + "score":0.7361702362 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"my", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.2486377856 + "score":0.3243318767 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.5019133104 + "score":0.5325074594 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.2573787999 + "score":0.29655196 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.4669380076 + "score":0.5575622672 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2438930348 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5213646779 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2864351463 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6249321785 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.2312626914 + "score":0.3727062795 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.4818505098 + "score":0.6078730814 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2916695233 + "score":0.2761405776 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.5596704495 + "score":0.5172440312 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.3464968589 + "score":0.3073830454 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5970733128 + "score":0.5312334894 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.2948086539 + "score":0.3738440243 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.5417485172 + "score":0.6210548081 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"mgsm", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ny", + "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2555109482 + "score":0.2080935284 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.4905742401 + "score":0.4613292908 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.3470151937 + "score":0.1142069107 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.512427307 + "score":0.4684888109 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"om", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"om", + "task":"mgsm", "metric":"accuracy", "score":0.6 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.3319169877 + "score":0.1248390462 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.5670040682 + "score":0.3912118415 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.3882912951 + "score":0.0733481499 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.6304381337 + "score":0.4043636025 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"or", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.2290327476 + "score":0.3088186789 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.5229250115 + "score":0.5586166118 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.3122409611 + "score":0.2551093032 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.4921734247 + "score":0.471197857 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2244630159 + "score":0.4788356583 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.4814457852 + "score":0.6806459378 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.2007945741 + "score":0.4407410774 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"uz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.4705479648 + "score":0.6057762292 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2150236607 + "score":0.2858167001 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.4970978512 + "score":0.5489970472 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.3603191861 + "score":0.3573911021 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.5938509481 + "score":0.5811687089 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2230132444 + "score":0.3641053048 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.49266873 + "score":0.588189418 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.0804541385 + "score":0.5753469236 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.1593791779 + "score":0.7440224371 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", "score":0.8 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.1997334357 + "score":0.3322929823 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.4568839976 + "score":0.5688847284 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.2322349452 + "score":0.5519246878 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.3049134513 + "score":0.7223799311 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2350235637 + "score":0.2548042194 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.528086246 + "score":0.5077624586 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.2524231151 + "score":0.4489469101 }, { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.3456705882 + "score":0.6629307467 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.4 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.6 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.1512958639 + "score":0.241720034 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.3039734334 + "score":0.490197442 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.0801602615 + "score":0.1941190598 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"am", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.1225273024 + "score":0.5032987767 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.1445854242 + "score":0.3417012568 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.3358973891 + "score":0.5625174346 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.1013154049 + "score":0.3132737681 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"apc", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.3155908724 + "score":0.4785817971 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.2238237549 + "score":0.2661551891 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.4534366926 + "score":0.5088142958 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.2689055687 + "score":0.2657051864 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ar", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.4149416248 + "score":0.468771605 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.159326316 + "score":0.1950454148 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.382299198 + "score":0.4066164793 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.1975279012 + "score":0.0895987522 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"arz", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.434347868 + "score":0.406366105 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.156849916 + "score":0.2277966149 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.3691380603 + "score":0.4790482859 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.1100740183 + "score":0.1890846456 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"az", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.3479696433 + "score":0.4927220926 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bho", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bho", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.1735533986 + "score":0.3283448359 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bho", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.393764966 + "score":0.5971969841 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bho", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.1575864364 + "score":0.4709197385 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bho", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.3025413929 + "score":0.6367420245 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":0.2 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2443635406 + "score":0.273412678 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.4676159664 + "score":0.5129343997 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.2223182846 + "score":0.1877009474 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"bn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.3685961254 + "score":0.5103267256 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.2633055293 + "score":0.3590806785 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.451378667 + "score":0.5793899495 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.2576565152 + "score":0.4522863769 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"de", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.3874723625 + "score":0.69205378 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.3974650186 + "score":0.3219627814 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5373829936 + "score":0.5598942303 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.5868227988 + "score":0.4361318725 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"en", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.7574063883 + "score":0.6665904527 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2163623393 + "score":0.2472520967 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.4705179867 + "score":0.5258675516 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.2458237388 + "score":0.3092184178 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"es", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.426538099 + "score":0.5908056148 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.2533539434 + "score":0.4085013861 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.4119435555 + "score":0.624313704 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.1546982368 + "score":0.3558604021 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fa", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.461201833 + "score":0.5800045033 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", - "score":0.1 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.2168672818 + "score":0.2686417951 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.4298161123 + "score":0.5013057378 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.2544899664 + "score":0.269846858 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fil", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.4510886635 + "score":0.477780812 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"th", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"th", "task":"mgsm", "metric":"accuracy", - "score":0.7 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.3182982487 + "score":0.2834577064 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5389072956 + "score":0.5125776742 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.47314841 + "score":0.3998428237 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"fr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.6884710951 + "score":0.5544961029 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.2054043097 + "score":0.2654309389 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.3989649156 + "score":0.4824817611 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.0395886562 + "score":0.1862233406 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"gu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.1860957619 + "score":0.2911678276 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.1 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.1042634561 + "score":0.3108788704 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.2700025792 + "score":0.5602956663 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.2494923018 + "score":0.3518016236 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ha", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.4977126554 + "score":0.5965516262 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.2684001499 + "score":0.2801238065 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.416230929 + "score":0.5303841848 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.2827365983 + "score":0.4297505232 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"hi", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.5128198247 + "score":0.6084569418 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"id", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.7 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"id", - "task":"mmlu", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.05869634 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.2062284007 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0559741426 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.2728382878 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ur", + "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"id", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.223787985 + "score":0.2899278495 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"id", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.485186041 + "score":0.5575393299 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"id", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.3571004344 + "score":0.2752599873 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"id", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.6398491182 + "score":0.476774558 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"it", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"it", - "task":"mgsm", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2826575967 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.5327013244 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.3655163534 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.6164677172 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"vi", + "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"it", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"it", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2225226541 + "score":0.3239526293 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"it", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4359559623 + "score":0.5501317095 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"it", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.2708679556 + "score":0.395432451 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"it", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.4908463656 + "score":0.6050844519 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ja", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ja", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ja", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.3 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ja", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.1711796281 + "score":0.1463159063 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ja", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.4108641598 + "score":0.3734663519 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ja", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.2194500975 + "score":0.0899876038 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ja", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.3589526769 + "score":0.3152591585 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"jv", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"jv", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.1994883012 + "score":0.2446481916 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"jv", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.3942042616 + "score":0.4981230837 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"jv", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.2570478693 + "score":0.1046640677 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"jv", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.5215463463 + "score":0.1573468803 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.1622823381 + "score":0.2368457175 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.3112906344 + "score":0.4726833185 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.0777950259 + "score":0.0745513103 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"kn", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.286449259 + "score":0.4280480618 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.6 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.2242267538 + "score":0.1823100131 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.4739719705 + "score":0.4063332022 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.2193704377 + "score":0.0722898622 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ko", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.2898139055 + "score":0.2293754958 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2496973594 + "score":0.2476485874 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.435485932 + "score":0.4997416793 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.1379373956 + "score":0.2660169184 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ml", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.2513871995 + "score":0.2991680484 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.1828389227 + "score":0.27341846 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.3179756072 + "score":0.541063718 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.2129586558 + "score":0.3233289278 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"mr", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.4314516197 + "score":0.3475215495 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.24401684 + "score":0.3008140825 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.4592926922 + "score":0.5503351929 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.3739586622 + "score":0.3025859718 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ms", + "model":"anthropic\/claude-3.5-sonnet", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.6802015628 + "score":0.5616917702 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.1237069224 + "score":0.2714908932 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.3000426144 + "score":0.4981839139 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.0752750224 + "score":0.2421707351 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.1972354123 + "score":0.4638593828 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"af", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"om", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.0257539048 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.2236454943 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.0203648136 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.2172604464 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1894457708 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.380925147 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0698032229 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2623376551 + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pa", - "task":"classification", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ak", + "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.252814761 + "score":0.1552497705 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.4131775231 + "score":0.3876789912 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.2671823746 + "score":0.12404113 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.3966391033 + "score":0.387786267 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.2278356993 + "score":0.2654957101 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.4590175615 + "score":0.5223894972 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.2772231531 + "score":0.2492184328 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.4560149918 + "score":0.3844495283 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", - "score":0.1 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.2348823133 + "score":0.3358787565 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.4500923911 + "score":0.5936351207 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.4182790857 + "score":0.3077302936 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.649967582 + "score":0.5299097797 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":0.1 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.1839314203 + "score":0.2889865542 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4234191674 + "score":0.5430128204 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3489148579 + "score":0.4267246672 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.5567945257 + "score":0.6048255191 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.1949440941 + "score":0.2209069897 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.4275372517 + "score":0.4983774573 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.1720625024 + "score":0.2238610606 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.387179761 + "score":0.4561674954 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", - "score":0.1 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.2041105012 + "score":0.2218813556 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.3657796945 + "score":0.4561380984 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.3130978532 + "score":0.2970501456 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.5950962977 + "score":0.5026533348 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"as", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.2525982324 + "score":0.2349948321 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.4605822105 + "score":0.4767507943 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.1739645144 + "score":0.1835124052 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.3984988334 + "score":0.3948207636 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", - "score":0.1 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.1200373123 + "score":0.3743066609 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.3196364935 + "score":0.5599845365 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.1814754432 + "score":0.197638086 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.3157059838 + "score":0.4275815242 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"az", "task":"classification", "metric":"accuracy", - "score":0.1 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.1984127492 + "score":0.2511263756 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.4104368787 + "score":0.4884204513 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.2929382742 + "score":0.185215113 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.4500167319 + "score":0.4698145601 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.264346972 + "score":0.1867886283 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.4993975063 + "score":0.48432494 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.31801505 + "score":0.2914923356 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.5317972494 + "score":0.4904369651 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.181272453 + "score":0.2947535379 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.386776605 + "score":0.5165639924 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.2603415771 + "score":0.2396652186 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.4241396601 + "score":0.43949233 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"uz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"uz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.1963447008 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"uz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.4236533517 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"uz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.1559833307 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"uz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.3946264183 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"vi", - "task":"mmlu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bn", + "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.1705385375 + "score":0.3082568982 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.3747437419 + "score":0.5337051323 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.257036702 + "score":0.3355598159 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.4598854693 + "score":0.5162264918 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.192705772 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.444563462 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.078814153 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.1049283878 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.1352563368 + "score":0.4122857574 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.3763213166 + "score":0.6050858924 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.2591777223 + "score":0.3836458269 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.3119832776 + "score":0.6416210642 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", - "score":0.1 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"deepseek\/deepseek-r1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.2137844239 + "score":0.2735961462 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.5028557922 + "score":0.5476293362 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.3129908127 + "score":0.3182484892 }, { - "model":"deepseek\/deepseek-r1", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.3710290799 + "score":0.5528408781 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ar", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ar", - "task":"mmlu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"cs", + "task":"mgsm", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2373672543 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5260757727 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3285274303 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5590237808 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"arz", - "task":"classification", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"cs", + "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.2406381299 + "score":0.3514942306 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.4810229449 + "score":0.6058081868 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.2249075936 + "score":0.4019223656 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.4437585001 + "score":0.592911966 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.251982914 + "score":0.3635164411 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5269588388 + "score":0.5991540113 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.3081294684 + "score":0.5032720779 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.5221618044 + "score":0.693325521 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"el", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"el", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.3226520344 + "score":0.2964481503 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.5750653902 + "score":0.5313927058 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.3833943767 + "score":0.3878661569 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.5822540388 + "score":0.5730182703 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.5414890567 + "score":0.6109509541 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.6901603131 + "score":0.7441302539 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.65136344 + "score":0.7189431005 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.814288256 + "score":0.858877842 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2479212607 + "score":0.3415212877 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.4998884286 + "score":0.581216976 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.2970650759 + "score":0.3866651561 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.5373052889 + "score":0.6216604607 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.2793086929 + "score":0.2934935537 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.4720611769 + "score":0.5521598139 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.1318325912 + "score":0.2612039966 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.3864569881 + "score":0.4687393359 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fil", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.3666373087 + "score":0.3757506556 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.5839902989 + "score":0.5844308819 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.2824386471 + "score":0.3534386963 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.5388064333 + "score":0.6302138792 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3186845256 + "score":0.3472418737 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5933794038 + "score":0.5869792648 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.4349494723 + "score":0.55907943 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.6079740627 + "score":0.7254469966 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0579558321 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2491854022 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0644952316 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.27092494 + }, + { + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"gu", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.1773927146 + "score":0.3154133447 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.3630036378 + "score":0.5290294486 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.0949811313 + "score":0.2126420937 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.3340540429 + "score":0.4630333055 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"ha", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.5 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1872829527 + "score":0.1639811937 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.3848483899 + "score":0.3928914747 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.2170056607 + "score":0.1953419416 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.485021658 + "score":0.478395209 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3564149867 + "score":0.4173637317 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.5972656918 + "score":0.6215184775 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3029237977 + "score":0.4359736097 }, { - "model":"deepseek\/deepseek-r1-0528", + "model":"anthropic\/claude-3.7-sonnet", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.5276781303 + "score":0.6378773265 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"id", - "task":"mmlu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2576586101 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.4955502153 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1623467534 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.4282927035 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ht", + "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.2876911945 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.5482159609 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.2940448188 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.5448923741 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hu", "task":"mgsm", "metric":"accuracy", - "score":0.5 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.2897223986 + "score":0.3311462156 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5436301176 + "score":0.5917802475 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.2571014471 + "score":0.3618326454 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.4731076434 + "score":0.5905610326 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"id", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1827387853 + "score":0.30984493 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4769620326 + "score":0.5816152273 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.0613359658 + "score":0.4256755459 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.2105103816 + "score":0.6937537754 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.2802837747 + "score":0.2392256846 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.4893845985 + "score":0.50697791 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.1179961209 + "score":0.2113990452 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.3697436656 + "score":0.4634979196 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.2346057729 + "score":0.2765007451 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.4744017815 + "score":0.4939949219 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.1793887241 + "score":0.2531559761 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.4368728644 + "score":0.5360266274 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.2249815138 + "score":0.3367683936 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5077874682 + "score":0.5620478968 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.2125650621 + "score":0.3820994257 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.2904132435 + "score":0.617255004 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3249125796 + "score":0.3020669513 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5545635633 + "score":0.5652474506 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.2625209874 + "score":0.2526786297 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.5042437741 + "score":0.4189814818 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.1520275352 + "score":0.3764722943 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.3905524229 + "score":0.596660778 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.0999041852 + "score":0.2446930524 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.3246573528 + "score":0.5495728981 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.2703816733 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.5070503073 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.1229430143 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.3831192143 + "score":0.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.361635926 + "score":0.226882832 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.5409988692 + "score":0.5274827881 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.3917357782 + "score":0.2928073284 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.5329271965 + "score":0.5503591158 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.26251395 + "score":0.3359656431 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.5352694678 + "score":0.5832978038 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.3264296122 + "score":0.2052531723 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.5528035231 + "score":0.423812318 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.3390879053 + "score":0.2624484733 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.5804013742 + "score":0.5071140689 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.3506563803 + "score":0.3198638529 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.5763378703 + "score":0.5401137308 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2246840158 + "score":0.2455263458 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.5244113055 + "score":0.5060005291 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.3594079605 + "score":0.26830985 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.5726823578 + "score":0.3779300192 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.1351642547 + "score":0.0877409274 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.419979284 + "score":0.2860240482 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.1783822717 + "score":0.0878946168 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.3420045131 + "score":0.3792924127 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.2074916818 + "score":0.3575309079 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.4529002152 + "score":0.5809284684 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.3320288719 + "score":0.3412387019 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"sw", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.6201778863 + "score":0.5581098509 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.2510503336 + "score":0.2941552983 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.4902642703 + "score":0.5344011771 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.2210031154 + "score":0.2473518914 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ta", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4920579152 + "score":0.5038938769 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.3219720359 + "score":0.2928160974 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5542555367 + "score":0.531553217 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.2813682269 + "score":0.2381371552 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"te", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5156714123 + "score":0.5343730926 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2423449507 + "score":0.3831267967 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5073629744 + "score":0.5877718214 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.2856584071 + "score":0.3166439754 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"th", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.4617854306 + "score":0.5664991748 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2862677011 + "score":0.3248935831 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5325160504 + "score":0.556535727 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.3443407299 + "score":0.2773274773 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"tr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.6019992774 + "score":0.5134253387 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.2049672714 + "score":0.3902392905 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.4409541903 + "score":0.6255884221 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.291136983 + "score":0.4320552013 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"ur", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.4722890493 + "score":0.7162987249 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.290841669 + "score":0.2973625302 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.5420316418 + "score":0.5304507919 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.4456194272 + "score":0.2814844596 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"vi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.6359307779 + "score":0.5325214597 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.2592635841 + "score":0.3423342516 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5029886217 + "score":0.5714046498 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.0439234831 + "score":0.3073801688 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"wuu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.1458942547 + "score":0.535796278 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2131332995 + "score":0.2915844659 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.4719991036 + "score":0.5233082306 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.117107351 + "score":0.3496367393 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"yue", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.2063865989 + "score":0.6133721509 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.0 - }, - { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2199013913 + "score":0.1393773943 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.4962775874 + "score":0.3742917816 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.1813558493 + "score":0.1302935996 }, { - "model":"deepseek\/deepseek-r1-0528", - "bcp_47":"zh", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.3079482476 + "score":0.4828092948 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"am", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"am", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"om", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.4 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"am", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"am", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.278130538 + "score":0.1183565284 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"am", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.5385292979 + "score":0.3604387918 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"am", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.2384630665 + "score":0.0926735247 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"am", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.3608782934 + "score":0.407269173 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"apc", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"or", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"apc", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.3417210123 + "score":0.3454626797 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"apc", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.5899435952 + "score":0.5668266666 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"apc", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.2808352256 + "score":0.2472009189 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"apc", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.5279437548 + "score":0.455460052 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.3412745465 + "score":0.4397356804 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.5826925715 + "score":0.6588393086 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.390058702 + "score":0.4762161169 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.597901367 + "score":0.6165646404 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2884896124 + "score":0.2837156349 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.4868568502 + "score":0.5580363271 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.2753136771 + "score":0.3506539621 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"arz", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.4912165901 + "score":0.5826652331 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"az", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"az", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2496588936 + "score":0.3702288509 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"az", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4813242802 + "score":0.603198011 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"az", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.1805770029 + "score":0.5348426193 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"az", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.4382698967 + "score":0.7292524118 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bho", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bho", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.2478040527 + "score":0.3025325263 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bho", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5055046978 + "score":0.5428889158 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bho", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.2299760176 + "score":0.5423330128 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bho", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.4382930134 + "score":0.7003733903 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2988263355 + "score":0.254709734 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5680625724 + "score":0.5378272729 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.3895386095 + "score":0.4143683284 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.5693830083 + "score":0.6253967915 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.4 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.4245142301 + "score":0.1962212986 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.6390046108 + "score":0.4367493461 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.4937713215 + "score":0.1929905791 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.6856946146 + "score":0.5044002449 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.5700014681 + "score":0.2918138373 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.7211557733 + "score":0.5417251668 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.6711231356 + "score":0.3037847598 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.8279616884 + "score":0.4992460758 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.3344072959 + "score":0.2617759894 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.5751886204 + "score":0.5276633986 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.3905772718 + "score":0.2777846992 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.6166676981 + "score":0.4645319126 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fa", - "task":"mmlu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sn", + "task":"mgsm", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.3438075851 + "score":0.1183361048 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.5772164708 + "score":0.3272094202 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.2647913841 + "score":0.079124328 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.489934723 + "score":0.3902046622 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fil", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fil", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fil", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.4465199237 + "score":0.2117678963 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fil", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.6601536062 + "score":0.4359443689 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fil", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.3429301939 + "score":0.1732885789 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fil", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.6176510545 + "score":0.4964169161 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.3411643102 + "score":0.3255971416 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.5823324237 + "score":0.6008485267 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.549646027 + "score":0.4485218422 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.7334440232 + "score":0.6288500197 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"gu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"gu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.3431336081 + "score":0.2558609607 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"gu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.5478126679 + "score":0.4641225577 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"gu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.1775808906 + "score":0.2212772916 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"gu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.4530128509 + "score":0.5309758013 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ha", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ha", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ha", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ha", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.2923469792 + "score":0.3158889064 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ha", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5018131258 + "score":0.5748466359 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ha", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.2792533669 + "score":0.4289796381 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ha", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.5455037681 + "score":0.6719817133 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.4434404142 + "score":0.2686859348 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.6607832834 + "score":0.5049847235 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.4308263411 + "score":0.3662710201 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.6353494719 + "score":0.6470689802 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.3626330278 + "score":0.276310564 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5869542517 + "score":0.5265133216 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.4368014195 + "score":0.3356818462 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.6964617832 + "score":0.5995810459 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"te", "task":"mgsm", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.3422169639 + "score":0.4154607989 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5695643744 + "score":0.6309805607 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.3590717293 + "score":0.3267961489 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"it", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.5878176707 + "score":0.5560375728 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.3331002174 + "score":0.2492030159 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.579659503 + "score":0.4785567235 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.336969824 + "score":0.2416391156 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.4913494739 + "score":0.4777363194 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.3700621486 + "score":0.2828625213 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5837249923 + "score":0.5389976055 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.3088767184 + "score":0.379459074 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.5884562937 + "score":0.5425233372 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.3364506705 + "score":0.2043216296 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.568444139 + "score":0.4630588295 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.3756915681 + "score":0.170099018 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"kn", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.5684194735 + "score":0.285966574 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.2805488398 + "score":0.2999115931 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5298229011 + "score":0.5465058684 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.2739358937 + "score":0.3389488489 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ko", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.3591923755 + "score":0.6048347469 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.3735487132 + "score":0.281242043 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.5985929462 + "score":0.5334289579 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.2991127987 + "score":0.429141026 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ml", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.5530820193 + "score":0.5970789076 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.3338185652 + "score":0.0335871262 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.5787491818 + "score":0.1685656521 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.2806196555 + "score":0.0459514881 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.4516145469 + "score":0.2949770962 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ms", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ms", - "task":"mmlu", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2486274521 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.508189485 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2880255112 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4836035417 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uz", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ms", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.4099406931 + "score":0.2152838338 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ms", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.6343459464 + "score":0.4431377684 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ms", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.4650961929 + "score":0.3439565173 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ms", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.742377276 + "score":0.614390118 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.3081644584 + "score":0.3184530249 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.567441399 + "score":0.5591378012 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.2529515223 + "score":0.3979752911 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"my", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.5121166935 + "score":0.6309674882 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.1546333274 + "score":0.0582735609 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.3730093916 + "score":0.3023435605 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.0699361494 + "score":0.078527211 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"om", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.4093787348 + "score":0.3202313873 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.3421886958 + "score":0.2575010745 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.5848387431 + "score":0.5010134287 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.2784394077 + "score":0.1433567699 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"or", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.5108902329 + "score":0.1989285088 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.4372599799 + "score":0.1807854017 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.658993109 + "score":0.4444459462 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.4174871385 + "score":0.097668655 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.5931595705 + "score":0.4425301092 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.2722413511 + "score":0.138613234 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.5398004754 + "score":0.3633380586 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.3757453667 + "score":0.1255527769 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pl", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.579529149 + "score":0.2943453041 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.3198419121 + "score":0.2202422573 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.578067895 + "score":0.4809857806 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.5056809967 + "score":0.2522298384 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.6966172136 + "score":0.2981672562 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.2839962776 + "score":0.2355051896 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5461994333 + "score":0.5276826547 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.4589390255 + "score":0.3416160138 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.6469214364 + "score":0.4052096434 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.3972794455 + "score":0.3330382198 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.6232130593 + "score":0.5839627022 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.3415088181 + "score":0.3449975051 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sd", + "model":"anthropic\/claude-3.7-sonnet", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.5390152372 + "score":0.5825497566 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2669835517 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.5240335993 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2270338391 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.440172001 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"af", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.4043048116 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.5944297519 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.499303533 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.7212747243 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.2819090872 + "score":0.1929300991 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.5410426012 + "score":0.4140331595 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.2951438389 + "score":0.1217632337 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.5712604905 + "score":0.4239570091 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.4243816819 + "score":0.2668020262 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.6336752528 + "score":0.5382720996 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.3644641049 + "score":0.2942451115 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.5789291672 + "score":0.3948537197 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.3047162219 + "score":0.3183719205 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.5499065244 + "score":0.5861114184 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.4136384398 + "score":0.3080791098 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.5513959132 + "score":0.5400496227 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2782856704 + "score":0.3007148198 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5422402953 + "score":0.56125031 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.419062749 + "score":0.4435216687 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.6455051222 + "score":0.6147226174 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.31244285 + "score":0.1875598171 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.5630479496 + "score":0.489336688 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.2911146353 + "score":0.1959881242 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.4826415387 + "score":0.4184181558 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.2813736334 + "score":0.226812714 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.5350839669 + "score":0.4624634504 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.3532409319 + "score":0.2455579306 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.6242374823 + "score":0.4672104169 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"as", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.3436662566 + "score":0.225211407 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.59026429 + "score":0.475337495 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.447007323 + "score":0.0987347036 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.6624838094 + "score":0.3710433705 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.3135484165 + "score":0.3664463476 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.5406963315 + "score":0.5637794084 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.1901478921 + "score":0.2102096564 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.2245996516 + "score":0.4016844833 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"az", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.2392191989 + "score":0.2623718084 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.4953232912 + "score":0.503088988 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.2147687469 + "score":0.1154914703 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.2691081013 + "score":0.3988570155 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"be", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.3075560511 + "score":0.1615117356 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.5721434339 + "score":0.4748907807 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.3628421643 + "score":0.2424817869 }, { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.3921364269 + "score":0.4495742511 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"am", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.2720072911 + "score":0.2787657292 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.5061425801 + "score":0.5218950872 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.1852281481 + "score":0.2026807977 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.3131355766 + "score":0.4168764189 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.2661119281 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.5602064313 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.194000916 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.4535351144 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bn", + "task":"mgsm", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2723646085 + "score":0.3311551104 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.523730035 + "score":0.5619474693 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.3878873306 + "score":0.3738906354 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.592059186 + "score":0.5465489645 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.2181300738 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.4481685644 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.215871503 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.454646328 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.2101918607 + "score":0.4093718231 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.4594084738 + "score":0.624497016 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.171792145 + "score":0.3928115555 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.4130816559 + "score":0.6357826484 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.2526226356 + "score":0.2618384456 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.5007947756 + "score":0.5051359715 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.2513374937 + "score":0.2370701457 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.4492954272 + "score":0.5093826491 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.2672489266 + "score":0.3614997929 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.4952818431 + "score":0.6075438302 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.3639249804 + "score":0.4250759164 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.5538942616 + "score":0.6148435167 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.3382313883 + "score":0.3322365647 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5705047774 + "score":0.5893045134 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.5354923841 + "score":0.5389893408 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.7125417889 + "score":0.7126873721 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3388316195 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.559085934 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3169438238 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.4981307307 + }, + { + "model":"anthropic\/claude-sonnet-4", "bcp_47":"en", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.4617498931 + "score":0.4825264923 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.6321211549 + "score":0.68082594 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.5951204739 + "score":0.5992232007 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.7613397345 + "score":0.8046234958 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"es", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3547349164 + "score":0.3430620741 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5728186386 + "score":0.5743349585 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3576086442 + "score":0.3926109516 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6061019948 + "score":0.619328646 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.2676796828 + "score":0.3210865047 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5663114288 + "score":0.5628291341 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.2591969049 + "score":0.2322885818 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.4814104167 + "score":0.4668783462 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.4277064952 + "score":0.4168839668 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.6325003325 + "score":0.6386977285 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.3269491361 + "score":0.3546234926 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.612989238 + "score":0.6240074261 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.2978444639 + "score":0.3292803051 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5625976718 + "score":0.5747992621 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.5244850062 + "score":0.5300268114 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.7081676298 + "score":0.7191025853 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.10328558 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2982675123 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0624940624 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.2487717813 + }, + { + "model":"anthropic\/claude-sonnet-4", "bcp_47":"gu", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.3150102324 + "score":0.3449460589 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5340625085 + "score":0.553592379 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.2069349026 + "score":0.1978537012 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4761478869 + "score":0.4545082837 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"ha", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.218966139 + "score":0.2192965513 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.4181042336 + "score":0.4642021162 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.2395753169 + "score":0.2765720113 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.5013466224 + "score":0.5462639917 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.4286739426 + "score":0.4144634414 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6359453866 + "score":0.6214654965 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.4344801023 + "score":0.4534129099 }, { - "model":"google\/gemini-2.0-flash-lite-001", + "model":"anthropic\/claude-sonnet-4", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.6474630132 + "score":0.6589590592 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2772612689 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.5374508975 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1221025047 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3885482618 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ht", + "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.3126497326 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.5733116043 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.3882402101 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.6624914478 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hu", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.3116016155 + "score":0.3393506808 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5537049588 + "score":0.6050917672 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.3440495149 + "score":0.3513113523 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.6004337743 + "score":0.6039205342 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"id", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.289402493 + "score":0.3412154588 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5452343766 + "score":0.5991114384 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1879084772 + "score":0.4209501123 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.3787664659 + "score":0.6893145815 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.3561823456 + "score":0.2551553778 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.5619277442 + "score":0.5138522649 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.2609272138 + "score":0.2850564276 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.5344454302 + "score":0.5207891639 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.2485030856 + "score":0.2687344116 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.4688750005 + "score":0.5272540777 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.3577614115 + "score":0.2521419676 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.5550425425 + "score":0.5246932394 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"it", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.2106519512 + "score":0.3022388162 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.4804338475 + "score":0.5435384668 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.2003821738 + "score":0.3764287035 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.2850409306 + "score":0.6223142999 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3848912948 + "score":0.2645654805 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.6007084641 + "score":0.5314828839 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.3023908744 + "score":0.3107372447 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.5415851472 + "score":0.4566077399 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.2906692433 + "score":0.3598923473 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5058194876 + "score":0.5731300576 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2450137243 + "score":0.3220023978 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.4736891146 + "score":0.5987896066 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.3362256422 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.5937301471 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.4506461939 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.7014575648 + "score":0.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2814491551 + "score":0.2249890784 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.5513455988 + "score":0.5034200882 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.2724659132 + "score":0.3391843994 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.5135188138 + "score":0.5707828412 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", - "score":0.4 + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3651900786 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"om", - "task":"mmlu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.6151464618 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.1894654695 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.4093754295 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kn", + "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.1059783758 + "score":0.2918136532 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.3306681685 + "score":0.5456800793 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.044447102 + "score":0.2975642517 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.379164388 + "score":0.5201018846 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.3044074075 + "score":0.262347554 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.5411406602 + "score":0.5086539396 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.2312884216 + "score":0.324863236 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.5063263205 + "score":0.3928185911 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.3792889323 + "score":0.0865732382 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.6001893022 + "score":0.3303494458 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.4267930078 + "score":0.0819614343 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.583867208 + "score":0.30926584 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3814378567 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.5990132828 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2914418132 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.5356815834 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mai", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.2910351794 + "score":0.3426987765 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.5387220968 + "score":0.5951472349 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.352446244 + "score":0.2551863067 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.5847615168 + "score":0.5195593791 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.3275326122 + "score":0.2538113904 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5672682921 + "score":0.5210775783 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.4390630519 + "score":0.2197400214 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.6588223005 + "score":0.5546741997 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.266439807 + "score":0.3912899265 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5101737799 + "score":0.6091996357 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.4085478092 + "score":0.3473927547 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.5658655698 + "score":0.5540996255 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.3431093451 + "score":0.3219708707 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5329383828 + "score":0.5658325036 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2838954554 + "score":0.267663768 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.48412 + "score":0.4820888027 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.2763965367 + "score":0.3813299088 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.520411275 + "score":0.6248613325 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.4350912598 + "score":0.5190281346 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.6853284539 + "score":0.7387347937 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.2415112532 + "score":0.2217546445 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.4752276392 + "score":0.4614867807 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.2730244696 + "score":0.2018629647 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.5683000198 + "score":0.42603146 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.3528600199 + "score":0.3638956194 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5850279702 + "score":0.6069685866 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.3231474889 + "score":0.2818004563 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.5470305035 + "score":0.520988987 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2681599618 + "score":0.2888744227 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5133569475 + "score":0.5305153826 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.3973895019 + "score":0.3314709774 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.564303282 + "score":0.5984996024 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2806311806 + "score":0.2128497133 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.5431910468 + "score":0.4631762575 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.3916346072 + "score":0.170528296 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.6289997941 + "score":0.5195265013 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.2859928961 + "score":0.0865227031 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.5295533045 + "score":0.3281312148 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.3010091175 + "score":0.056144723 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.493353195 + "score":0.3812309298 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"or", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.2407351505 + "score":0.3285408012 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.4734226532 + "score":0.5645168724 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.3363563156 + "score":0.2820925848 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"uz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.5891323556 + "score":0.5101934539 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.3170290484 + "score":0.2859396371 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.5491010642 + "score":0.5523733153 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.4032471641 + "score":0.3163285848 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.6394566771 + "score":0.5051708575 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2746262088 + "score":0.2442291975 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.4924092277 + "score":0.5262128573 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.1648044562 + "score":0.2978567509 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"wuu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.2037009528 + "score":0.5693090483 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.1826865099 + "score":0.3458915528 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4272648905 + "score":0.5893254106 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.1499743312 + "score":0.4849210354 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.2347308661 + "score":0.6981449573 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.2557280993 + "score":0.317731832 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5212143675 + "score":0.5613754153 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.2610248692 + "score":0.4713164151 }, { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.314329989 + "score":0.6495822688 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2503325982 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5416976917 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3948676748 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.6159422103 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.339375511 + "score":0.2295101341 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.566407043 + "score":0.4799966973 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.2692320655 + "score":0.2510859963 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"am", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.3685144367 + "score":0.5565619536 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.3872368514 + "score":0.3515638071 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.6253206413 + "score":0.5824484364 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.3385588073 + "score":0.3241789047 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"apc", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.5846751763 + "score":0.4829492302 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.3462011916 + "score":0.2746497811 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.5813984303 + "score":0.5372002467 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.4319399394 + "score":0.3076981818 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.6269389132 + "score":0.4873474492 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.2639599801 + "score":0.1299381077 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.4789807253 + "score":0.3788726193 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.2907084686 + "score":0.1912277179 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.4882539682 + "score":0.4950017684 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.3101513593 + "score":0.2097508574 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.5253923906 + "score":0.445386701 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.216177525 + "score":0.1991170213 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"az", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.4555999734 + "score":0.4930051732 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.3246124272 + "score":0.2774555913 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.5547058357 + "score":0.5562717021 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.2300858071 + "score":0.4106937329 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bho", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.4391471287 + "score":0.6058388421 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.3332105938 + "score":0.2967826709 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.5788748413 + "score":0.5262571298 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.3925309816 + "score":0.2209836503 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.5671456285 + "score":0.5082942096 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.4080538745 + "score":0.3011367305 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.6278026445 + "score":0.564663941 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.4940498755 + "score":0.448345108 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.6915113583 + "score":0.6666956471 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.5780592594 + "score":0.3244718268 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.727062887 + "score":0.5658165542 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.725042796 + "score":0.407475727 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.868453404 + "score":0.6425140836 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.3228577771 + "score":0.2859927313 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5691176688 + "score":0.543203281 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.4211069488 + "score":0.3180064929 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.6329026504 + "score":0.5878963723 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"te", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"te", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.3659700454 + "score":0.457193264 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5807664259 + "score":0.6605869611 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.2252471667 + "score":0.3695252842 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.4480100347 + "score":0.5799625426 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.447799796 + "score":0.2009085121 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.6437494805 + "score":0.4600287687 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.318387966 + "score":0.2198024006 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.6173467767 + "score":0.4640276677 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"th", "task":"mgsm", "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.3683003934 + "score":0.2907627934 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5961800274 + "score":0.5558044872 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.5899042948 + "score":0.3933820255 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.7506595836 + "score":0.5410635816 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.3793081536 + "score":0.1783537399 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.5865031052 + "score":0.4347699538 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.2344717249 + "score":0.1382203867 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.4873543825 + "score":0.2283013271 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.3157236901 + "score":0.3344661609 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5365403784 + "score":0.5823607578 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.3221592053 + "score":0.3519575693 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.565816945 + "score":0.5873812009 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.4661333335 + "score":0.231149484 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.6599650679 + "score":0.5147846224 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.4319599559 + "score":0.4089741506 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.6493733048 + "score":0.586691795 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.3507436052 + "score":0.0407386888 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.5856872774 + "score":0.1524708774 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.387557065 + "score":0.0615467888 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.6730969345 + "score":0.2411879984 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.3498261827 + "score":0.2976308897 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5707332142 + "score":0.5789469354 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.35475083 + "score":0.3161395969 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.5942822113 + "score":0.4958567702 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.3590987818 + "score":0.2607779047 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.5958999814 + "score":0.5026594084 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.4151803591 + "score":0.3155204999 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.5319028037 + "score":0.5892994562 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3793672083 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6054760312 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3161702144 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5956895972 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"vi", + "task":"mmlu", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.3051972526 + "score":0.2266398655 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.5542686332 + "score":0.4844747718 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.3567486129 + "score":0.3284536924 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.5611431734 + "score":0.5738443768 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.3 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.2872143997 + "score":0.0897090973 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.5525223441 + "score":0.3056008006 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.3116476133 + "score":0.1036046651 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.3648802199 + "score":0.3287187985 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.4065449181 + "score":0.2179300592 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.6069224309 + "score":0.5011175701 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.3084108149 + "score":0.1863553829 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.5610104654 + "score":0.2320124968 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.2888720948 + "score":0.2455042454 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.5411662197 + "score":0.4980044603 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.2820351359 + "score":0.1581907622 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.5017455952 + "score":0.4829223036 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.4137133794 + "score":0.109344665 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.6312868188 + "score":0.3572196014 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.4812654706 + "score":0.0982287816 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ms", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.7314221816 + "score":0.2450420475 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.3696810103 + "score":0.2396091802 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.5941720939 + "score":0.5123401487 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.3374140159 + "score":0.2229490278 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"my", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.5598126987 + "score":0.2797129431 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.1552982789 + "score":0.2637315312 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.4088650794 + "score":0.550920529 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.0578542594 + "score":0.3126940794 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"om", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.4227186624 + "score":0.3809708703 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.3491547876 + "score":0.2898457226 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.6003545703 + "score":0.563083348 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.307748028 + "score":0.2463331565 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", + "model":"anthropic\/claude-sonnet-4", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.5199829894 + "score":0.5526475142 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.4833653569 + "score":0.2057963854 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.6877252787 + "score":0.4190801172 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.4959043786 + "score":0.1996247285 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.631939007 + "score":0.4442043679 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"af", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.345076722 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.5982949848 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.3888863333 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.6077722316 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.5 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.4185968559 + "score":0.1217071927 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.6194298291 + "score":0.328265152 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.5066913819 + "score":0.0291184089 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.7045563325 + "score":0.3034981634 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.2835606416 + "score":0.2026417516 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.5525332546 + "score":0.463337874 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.5294387768 + "score":0.1217867685 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.6814959444 + "score":0.2662662886 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.4019575944 + "score":0.2523784543 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.6276858351 + "score":0.5195328715 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.3830695907 + "score":0.2422451252 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.5452929704 + "score":0.5264317244 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.4452506057 + "score":0.2660357996 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.6299322033 + "score":0.5489237487 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.4773237879 + "score":0.3431691167 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.6983325706 + "score":0.5659025601 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.2765535661 + "score":0.1411356359 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.5553462948 + "score":0.4480483081 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.3584530222 + "score":0.1518080432 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.6096517359 + "score":0.3858829748 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.4838983303 + "score":0.221843468 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.6878651593 + "score":0.4559655934 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.4225689448 + "score":0.1965127641 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.6171822766 + "score":0.4448745325 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"as", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.363389223 + "score":0.2397069931 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.5927603201 + "score":0.475288864 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.4280908922 + "score":0.1580418587 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.5695430758 + "score":0.3840415666 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.3532965173 + "score":0.3229660121 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.6170908018 + "score":0.5510776215 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.4401941591 + "score":0.1731926352 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.6752054069 + "score":0.3746553107 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat", + "bcp_47":"az", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.3194163699 + "score":0.1557419708 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.5758075077 + "score":0.4249908572 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.2609063103 + "score":0.1551519146 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.4351160146 + "score":0.4046874828 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"be", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.3488574237 + "score":0.1827705659 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.5833892626 + "score":0.4758300316 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.3525318348 + "score":0.2887000518 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.600901419 + "score":0.4689651175 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.4227968054 + "score":0.2524146198 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.6326522416 + "score":0.4953606649 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.4693432911 + "score":0.1826604742 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.6659480306 + "score":0.3887388562 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"wuu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"wuu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.3241760602 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"wuu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.5694459727 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"wuu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.1373684835 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"wuu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.1808455778 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2666023686 + "score":0.2999810338 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5200218275 + "score":0.5315905896 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.1881613886 + "score":0.3568113924 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.2877597368 + "score":0.5379558638 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.2632355471 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.5527183044 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.3128970722 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.3699956681 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"am", - "task":"mmlu", - "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.2883756135 + "score":0.3821149754 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.5452929372 + "score":0.5961975536 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.2563045907 + "score":0.346540273 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.3587997566 + "score":0.6141374461 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.3529391424 + "score":0.1899525093 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.6061230642 + "score":0.4989816408 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.3735935027 + "score":0.1315130933 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.6118752881 + "score":0.4341433104 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.3509446122 + "score":0.3339653303 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.5872861306 + "score":0.5865996685 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.4369226272 + "score":0.4005566788 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.6357392299 + "score":0.5928360984 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.2689181562 + "score":0.3410327538 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5103302194 + "score":0.5702449417 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.2811045733 + "score":0.4621824412 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.4796679654 + "score":0.6644677733 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"el", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.2402619776 + "score":0.3296804956 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.4816842061 + "score":0.5432353476 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.2017479595 + "score":0.3361581186 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.4438028104 + "score":0.528779004 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3118354834 + "score":0.5530727537 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5301057957 + "score":0.7075859327 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.2712094702 + "score":0.6368037655 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.4554148161 + "score":0.8170495194 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2928560114 + "score":0.3558328881 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5373877759 + "score":0.5816613686 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.371713483 + "score":0.3018683161 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.5467648432 + "score":0.5862734644 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.3827187056 + "score":0.2520796337 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.6092943987 + "score":0.5331446204 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.5181328066 + "score":0.1921744404 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.6981190119 + "score":0.407787256 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.5942868447 + "score":0.3243217549 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.7298379077 + "score":0.5392052945 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.7309888475 + "score":0.3295144102 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.8534239972 + "score":0.5926958618 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3497891701 + "score":0.3482763208 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5889817614 + "score":0.5982327963 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.395885417 + "score":0.452269216 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.6273835234 + "score":0.6590312745 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fa", - "task":"mmlu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.038115978 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2335371377 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0230267925 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.2225585574 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"gu", + "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.3764428485 + "score":0.2919455567 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5794911256 + "score":0.5131981959 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.3019679958 + "score":0.1292315656 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.5314471888 + "score":0.4092770954 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fil", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fil", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fil", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.3970330872 + "score":0.1854918728 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fil", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.6224300541 + "score":0.3934600154 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fil", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.3731416111 + "score":0.266974078 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fil", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.6421804886 + "score":0.5393383261 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3737227872 + "score":0.3747394322 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6039484183 + "score":0.6079633657 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.5555743798 + "score":0.4420465241 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.7229519037 + "score":0.6372857982 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"gu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"gu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.344471287 + "score":0.2331017118 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"gu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.5591834446 + "score":0.4736195736 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"gu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.180119873 + "score":0.1022265448 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"gu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.4654772276 + "score":0.3883925189 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ha", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ha", - "task":"mgsm", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"hu", + "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ha", - "task":"mmlu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hu", + "task":"mgsm", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ha", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.2852268084 + "score":0.2769514475 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ha", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.4820918601 + "score":0.5440818488 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ha", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.318588004 + "score":0.3439976656 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ha", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.5675346049 + "score":0.583941298 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.4387215588 + "score":0.3120299438 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.6443095169 + "score":0.5421647326 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.4255607348 + "score":0.3139800299 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.6457270128 + "score":0.6305869448 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"id", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"id", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"id", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.3789722313 + "score":0.1948861013 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"id", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.5973074889 + "score":0.4359300942 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"id", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.406320567 + "score":0.2500136994 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"id", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.6828299565 + "score":0.4929182362 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.1414246135 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.400392952 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.1754521219 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4706209345 + }, + { + "model":"deepseek\/deepseek-chat", "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"it", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.3177725576 + "score":0.2726271593 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5648818053 + "score":0.5135668055 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.3654943432 + "score":0.3420319137 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.5949572053 + "score":0.6095914494 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"ja", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3423388267 + "score":0.2121435327 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5884893314 + "score":0.5165098934 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.3740472584 + "score":0.3965805608 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.4832664839 + "score":0.5197322727 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.3540174328 + "score":0.2594796679 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5513315973 + "score":0.4780086047 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.329885986 + "score":0.3009966401 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"deepseek\/deepseek-chat", "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5805485408 + "score":0.5761529867 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.2512885128 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.4934774392 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.3278617048 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.5102619479 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ko", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ko", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2465751079 + "score":0.2316697911 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ko", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.515705028 + "score":0.4912151365 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ko", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.2528779436 + "score":0.2880260216 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ko", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.3488788279 + "score":0.5039209227 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ml", + "model":"deepseek\/deepseek-chat", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ml", + "model":"deepseek\/deepseek-chat", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.3532448793 + "score":0.2667770035 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ml", + "model":"deepseek\/deepseek-chat", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.5657281022 + "score":0.5371226098 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ml", + "model":"deepseek\/deepseek-chat", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.3046979511 + "score":0.1137141251 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ml", + "model":"deepseek\/deepseek-chat", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.5523287159 + "score":0.3542419226 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"mr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"mr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.3055522766 + "score":0.2597105982 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"mr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.5435968357 + "score":0.4929733942 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"mr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.257460039 + "score":0.1901313405 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"mr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.4845716024 + "score":0.4793446685 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ms", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ms", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ms", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.3746934831 + "score":0.2650641815 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ms", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.6046609636 + "score":0.5151986111 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ms", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.4734156929 + "score":0.2220814456 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ms", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.7284733826 + "score":0.318063422 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"my", + "model":"deepseek\/deepseek-chat", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"my", + "model":"deepseek\/deepseek-chat", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.3552781219 + "score":0.0836411722 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"my", + "model":"deepseek\/deepseek-chat", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.5977013775 + "score":0.2984177736 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"my", + "model":"deepseek\/deepseek-chat", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.3211140622 + "score":0.043655724 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"my", + "model":"deepseek\/deepseek-chat", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.544805929 + "score":0.2335929953 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"om", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 + "model":"deepseek\/deepseek-chat", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3229689104 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"om", - "task":"mmlu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.5803873354 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2069505913 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.489819774 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"mai", + "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"om", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.1871006972 + "score":0.2481653983 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"om", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.4365658925 + "score":0.5271356217 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"om", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.106229994 + "score":0.182427997 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"om", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4277182017 + "score":0.4654775647 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"or", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"or", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.3740486194 + "score":0.1686533634 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"or", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.6141131486 + "score":0.3897581367 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"or", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.31231668 + "score":0.1950122982 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"or", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5222572922 + "score":0.4912322205 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.4182659606 + "score":0.3261687004 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.6696655487 + "score":0.5570892069 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.4665320226 + "score":0.3239362726 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.6280330147 + "score":0.5507453743 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.3282584844 + "score":0.2536168105 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5713765921 + "score":0.5193737639 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.3762753954 + "score":0.2743904396 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pl", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.5940500139 + "score":0.4918283752 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.3485890022 + "score":0.2986347511 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.574915747 + "score":0.5339411724 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.4760104707 + "score":0.3783664491 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.6891420805 + "score":0.6540376697 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"my", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.2893557086 + "score":0.2199531275 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.5514512546 + "score":0.4736214414 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.4910352633 + "score":0.2571304866 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.6636379715 + "score":0.5221658577 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.3296224998 + "score":0.3141227729 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5499189472 + "score":0.545378522 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2231786181 + "score":0.2384329055 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sd", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.407169401 + "score":0.4946334042 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.397583037 + "score":0.2960130626 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.6014699575 + "score":0.5398408986 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.4540021563 + "score":0.2642890319 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.7002830052 + "score":0.5934736192 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2981018347 + "score":0.1039040494 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.5573394656 + "score":0.343251081 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.3033361537 + "score":0.0893012181 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ta", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.5406646936 + "score":0.42437101 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"om", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"om", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.4025505277 + "score":0.0512543236 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.6339036498 + "score":0.2613232237 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.4166086163 + "score":0.0260385015 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"te", + "model":"deepseek\/deepseek-chat", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.6171953291 + "score":0.3274101513 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.3196721957 + "score":0.271766815 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.5597673276 + "score":0.5041819226 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.4114706745 + "score":0.1870998997 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"th", + "model":"deepseek\/deepseek-chat", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.560767027 + "score":0.4329741844 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.3291780472 + "score":0.4307107958 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.5900439285 + "score":0.6547934264 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.4285247051 + "score":0.3789232965 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tr", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.6508035663 + "score":0.5490387026 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3212777323 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5735084601 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3027958989 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4912965943 + "model":"deepseek\/deepseek-chat", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"uz", - "task":"classification", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pl", + "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2583582755 + "score":0.2715804037 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.483302551 + "score":0.5307525116 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.3579243963 + "score":0.3285527346 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"uz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.6083657804 + "score":0.5692291394 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.3471784526 + "score":0.3491027097 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5719753053 + "score":0.5771246685 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.4601231177 + "score":0.3737440632 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"vi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.6644848789 + "score":0.6547073078 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"wuu", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"wuu", - "task":"translation_from", - "metric":"bleu", - "score":0.2968992777 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"wuu", - "task":"translation_from", - "metric":"chrf", - "score":0.5258850631 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"wuu", - "task":"translation_to", - "metric":"bleu", - "score":0.1321430026 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"wuu", - "task":"translation_to", - "metric":"chrf", - "score":0.176594989 + "model":"deepseek\/deepseek-chat", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"yue", - "task":"classification", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ro", + "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.2756047962 + "score":0.2650680958 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.518253876 + "score":0.5205343441 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.2356751392 + "score":0.4511284085 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"yue", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.3051882861 + "score":0.6282365697 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2989639846 + "score":0.2584319121 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5646599732 + "score":0.5177022275 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.2915310914 + "score":0.371218137 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.3358004159 + "score":0.5948906549 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.2393172056 + "score":0.0926162696 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.4971254293 + "score":0.3328045162 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.2089212841 + "score":0.1301545031 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"am", + "model":"deepseek\/deepseek-chat", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.3406916002 + "score":0.4379044144 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.2712045148 + "score":0.2619487807 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.5477096036 + "score":0.4937679545 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.178052271 + "score":0.2097242522 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"apc", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.468064885 + "score":0.4402768379 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.2747843596 + "score":0.2206007581 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.5519960681 + "score":0.4841625224 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.2863967069 + "score":0.2418583032 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.5318173199 + "score":0.4464397214 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.1892846534 + "score":0.0858734443 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.4212342522 + "score":0.3340485034 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.1938470016 + "score":0.1646186552 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"arz", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.4527968539 + "score":0.4670539114 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.200456445 + "score":0.2147068836 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.4226152307 + "score":0.4416005881 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.1414132922 + "score":0.1631062755 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"az", + "model":"deepseek\/deepseek-chat", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.4170843853 + "score":0.4541385931 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.2663307677 + "score":0.2705284479 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.519985227 + "score":0.5472822854 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.1913577407 + "score":0.3949384152 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bho", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.4064669591 + "score":0.5962190033 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"su", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.271237739 + "score":0.247144381 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.5173954387 + "score":0.472335293 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.3067537945 + "score":0.2147391336 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.5194482945 + "score":0.5213195361 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3189602129 + "score":0.3112375203 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5548503533 + "score":0.5600711232 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.5229096392 + "score":0.3915983131 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.7023434262 + "score":0.6470079791 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.3889146477 + "score":0.2583542451 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.628092835 + "score":0.5157482031 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.3458513734 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.634706105 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2339300786 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4691042738 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2567323645 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5361849509 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3887890595 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.6100201392 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.3146346509 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5476489231 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.1544230564 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4169441821 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.203628947 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4354012087 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2554271374 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5059580785 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.3635410685 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.5132811401 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.1818206483 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.3817278149 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.1031390295 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.2139568479 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.3173811815 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5742755278 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3658586977 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5886644893 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2739927286 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5313085407 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3396470191 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.56896944 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0391048872 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1804054377 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0422939527 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.2015864716 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2324983634 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.497221173 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2976387517 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4761547661 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2305488159 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.4723700911 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2058479152 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.4902380763 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.3027505857 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5506378818 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3708866541 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.5846851624 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0772031909 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.238183844 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0504923015 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.3006315368 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2388037754 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.5072972409 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1136417481 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1766903691 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.1425657247 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.3799312791 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0602102371 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.4158042285 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0751924362 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.27475056 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0837679098 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.2484365945 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.143983328 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.3955437811 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.2002778421 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2907084137 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2377253988 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5405656214 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2660263348 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3459946232 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1095698729 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.379524938 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.2569801761 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.5416847655 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2340706769 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4849021224 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2324871288 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.463163379 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.1145237929 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.321984884 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0457100188 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.345736773 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.2016755199 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.4502815524 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.1687061726 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.2849440478 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.2569252635 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.5329928091 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.2423805131 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.5144112629 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2993048546 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5651988199 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.3853695566 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.602672086 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1414242697 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4491969143 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1969875411 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.4112680984 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1819096557 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4374822654 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2316387528 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4676592617 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2150708922 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4723591307 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.1405266408 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.3821492664 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3061008878 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5403845189 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1651572659 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.3834555839 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.1950569484 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4560500844 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1448904562 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.4007813245 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.1568183376 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4733150063 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2952652338 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4756055948 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2098690628 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4737398201 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1892048942 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.3849575805 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2798537803 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5394779979 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3719179468 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.539682577 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.40271244 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.6036828752 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.3295443052 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.592814404 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.1908998381 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4722273522 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.1077730104 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.4189694789 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.3296294187 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.5743852794 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.3965244172 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.6187707189 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3207762021 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5555389401 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.4227752207 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6601015066 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3139195907 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5175917627 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3178080544 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5080472014 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5548034204 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.7071106777 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.6432470265 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.8278285651 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3223436235 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5379000389 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3061941236 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.5918382188 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.3294693656 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5673243159 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1938427279 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.4526315895 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3412226864 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5602175563 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.2910894115 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.5672691361 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3297556296 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5925809306 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.4619761505 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.6734036273 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0307272557 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2077475007 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0256705679 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.2168141904 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.3055790363 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5265498141 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1365241949 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4093204393 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1778454432 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4028796881 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.2463440773 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.5200026897 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3412169553 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.598919602 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3937102354 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.6229439454 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2297889676 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.4704431893 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1375213911 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.388908417 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2789946732 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5442737128 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3066060037 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.556064896 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3020610187 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5462026627 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.299038365 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.625735911 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.1946429546 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.4570475303 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.2287931181 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.4943000447 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.233903322 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4813311361 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.160985695 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4538812051 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.254215081 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5128620442 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3318074211 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5973973733 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.1875636541 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5136106256 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.3333377273 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4709407515 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.2789250445 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.52614288 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2580648249 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.574708573 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.18097458 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4665455335 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.1950643939 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4676749835 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3008270138 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5432166189 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.0884771533 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3265400527 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2431929513 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.4397197217 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.1999599641 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4781553813 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2497463416 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.5083726446 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.2002123483 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.2845065116 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0855626682 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2894501335 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0163561936 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.2383002969 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3116845131 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.5936722206 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2244694024 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.491879277 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.3230054961 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5636252799 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.2128915517 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.4613197046 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2499065804 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.4673527976 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.1281964384 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.4588308902 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.319035437 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.555554753 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2835968152 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.5094572017 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2487969868 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.518708582 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2238578938 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4748109447 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3058774517 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5603224049 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.3684068806 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6535736283 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2253225205 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4798221167 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.2383027705 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.504994716 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.3350990447 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5554923615 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.2492753068 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.5052232921 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2733774487 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.4886433877 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.2525535773 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.5869217143 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.1449724535 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.3965148993 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0942041621 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.4155041047 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0235872225 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2475231508 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0365961569 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.3050512265 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.2767258101 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.514091898 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.1796236972 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.4422888692 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.3823229705 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6453681393 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.3548387061 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5492435889 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2581682802 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5198796684 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.2662027737 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.540420297 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3091555064 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5528775735 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.3860807525 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6710753294 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.2477037529 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5045143807 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.394880747 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6072982987 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2464304597 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5343201712 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3592456339 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.5816925415 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1293187691 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.3738214096 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.1003361282 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.3952274191 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.2486377856 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.5019133104 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.2573787999 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.4669380076 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.257967718 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.5080229639 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.2025556713 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.3947833 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0690009512 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3268004816 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.1294343719 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.4480995236 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.1898460053 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.4405765457 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1095645758 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.4118027966 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2800732787 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5502272532 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4072726699 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.6058201233 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.2040949055 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.43974538 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.2090628208 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.5097240815 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.2774768567 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5443247574 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.3840976738 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6378529698 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.2438930348 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5213646779 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.2864351463 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.6249321785 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2312626914 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4818505098 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2916695233 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5596704495 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3464968589 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5970733128 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.2948086539 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5417485172 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.1765221595 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4369131192 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.2151708901 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4392843531 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2555109482 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.4905742401 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.3470151937 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.512427307 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.1515985315 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.3742059137 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.1108390908 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.210084949 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.3319169877 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5670040682 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3882912951 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.6304381337 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2755215402 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5261420761 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3549575463 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5828055284 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0366134631 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1741100437 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0154547723 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1399251318 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2290327476 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5229250115 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.3122409611 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4921734247 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2244630159 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.4814457852 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2007945741 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.4705479648 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2150236607 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.4970978512 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3603191861 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.5938509481 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0717040801 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2570725566 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0371460136 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.2645911946 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2230132444 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.49266873 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0804541385 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1593791779 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.1516053677 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.3870787615 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.051561205 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.3871526823 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0693546179 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2831628097 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.1008748312 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.2529276987 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1997334357 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4568839976 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.2322349452 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.3049134513 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2350235637 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.528086246 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2524231151 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3456705882 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1624728483 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.4496327865 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.2537223237 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.5463123746 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2402975983 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4194922076 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1338075038 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3511060104 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.1357614328 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.3566810684 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0294893106 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.2512539061 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.1512958639 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.3039734334 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0801602615 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.1225273024 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.1445854242 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.3358973891 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.1013154049 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.3155908724 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2238237549 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.4534366926 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.2689055687 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.4149416248 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.0975874673 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.3248757407 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1178477307 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.2954831248 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.159326316 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.382299198 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.1975279012 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.434347868 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.1616056325 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.333451919 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0517558436 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.1667611675 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.1822663929 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.3603211978 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.0853061805 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.2591570919 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.156849916 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.3691380603 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1100740183 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.3479696433 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.1450162321 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4059490259 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2328037895 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.3851910422 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.1735533986 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.393764966 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1575864364 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.3025413929 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2443635406 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.4676159664 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.2223182846 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.3685961254 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.3180611809 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.5065841887 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.2680634152 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.5259443653 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.1699873084 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4049081719 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.1497155398 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.3184438517 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.2338536957 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.4766184042 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.2064068309 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.3746311154 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.2633055293 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.451378667 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.2576565152 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.3874723625 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.262811264 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.4775521011 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.1965649232 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.3326158945 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.3974650186 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.5373829936 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.5868227988 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7574063883 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.2163623393 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.4705179867 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.2458237388 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.426538099 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2533539434 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.4119435555 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1546982368 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.461201833 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.2168672818 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.4298161123 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.2544899664 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.4510886635 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3182982487 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5389072956 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.47314841 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.6884710951 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0355335694 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1603046868 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0146310492 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1847185113 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.2054043097 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.3989649156 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.0395886562 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.1860957619 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1042634561 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.2700025792 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.2494923018 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4977126554 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.2684001499 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.416230929 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.2827365983 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.5128198247 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.1483876396 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.3041127486 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.0867728202 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.2892236166 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2451203581 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.4667806078 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.2680074322 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.4714945694 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.223787985 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.485186041 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3571004344 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6398491182 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.1560495384 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.3475080534 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1427020575 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.2902772917 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.2002526169 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4138800613 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.1417817824 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.3836219075 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.2225226541 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.4359559623 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.2708679556 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.4908463656 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.1711796281 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.4108641598 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.2194500975 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.3589526769 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.1994883012 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.3942042616 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2570478693 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5215463463 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.1546042692 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4407575564 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.2471551193 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4847447773 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.273955881 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5078342939 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.05512322 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.1415530353 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.1622823381 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.3112906344 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.0777950259 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.286449259 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2242267538 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.4739719705 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.2193704377 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.2898139055 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.1346054696 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.3409559995 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0394802393 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.2573657649 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.1819054463 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.3169358876 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.104449722 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.3335661802 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.1790591986 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.3273464644 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.0709002184 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.2564650613 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.1088802366 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.3340713822 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.138140887 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.5001663831 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.2496973594 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.435485932 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.1379373956 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.2513871995 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.1828389227 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.3179756072 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2129586558 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4314516197 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.24401684 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.4592926922 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.3739586622 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6802015628 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.1237069224 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.3000426144 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.0752750224 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.1972354123 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.2657383448 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5050071583 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.1687285867 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4021301132 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2202972405 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.4092623804 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.3159175655 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.5588876314 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.092498489 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.2505889593 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0281527677 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.1893859434 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0257539048 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2236454943 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0203648136 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.2172604464 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.1894457708 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.380925147 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.0698032229 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.2623376551 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.252814761 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.4131775231 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.2671823746 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.3966391033 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2278356993 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.4590175615 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.2772231531 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.4560149918 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.2348823133 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.4500923911 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4182790857 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.649967582 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.2343936577 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.4827310176 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.3388526407 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.5454578721 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.1839314203 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.4234191674 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3489148579 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.5567945257 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1402474958 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.3500619576 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.0777850092 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.3273785033 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.1949440941 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.4275372517 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.1720625024 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.387179761 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.2272550261 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.5004185979 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.1082324911 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.2676221295 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.122708093 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3763985899 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.1795400131 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.4606246254 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.1736253216 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.3845743827 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1212907088 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.3790107218 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2260669876 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.4794686178 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4126611726 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.5967801454 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.1563243249 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.3099234307 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.2041414382 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.5298340938 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.2570489843 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.4028888696 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.2324980283 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.4203934844 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.2041105012 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.3657796945 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.3130978532 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.5950962977 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2525982324 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4605822105 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.1739645144 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.3984988334 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.1200373123 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.3196364935 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.1814754432 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.3157059838 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.187751348 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4405758845 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.2191046369 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4677894227 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.1984127492 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.4104368787 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.2929382742 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.4500167319 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.1223581489 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.3679278604 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0119991714 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0656655661 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.264346972 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.4993975063 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.31801505 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5317972494 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2705929623 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5134621473 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.256831195 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.4554987689 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.0897426047 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0174118264 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1924672099 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.181272453 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.386776605 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2603415771 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4241396601 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.1963447008 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.4236533517 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.1559833307 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.3946264183 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.1705385375 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.3747437419 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.257036702 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.4598854693 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0825950269 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2748258429 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.039067574 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.2124733373 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.192705772 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.444563462 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.078814153 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1049283878 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.0644184223 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.2244706008 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0232220251 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.2052740772 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0620084814 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2964981916 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0414688547 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.1387297621 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1352563368 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.3763213166 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.2591777223 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.3119832776 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2137844239 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5028557922 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.3129908127 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3710290799 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1943812143 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.4323832185 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.094824393 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.2713939288 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2373672543 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5260757727 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.3285274303 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5590237808 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.2406381299 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4810229449 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2249075936 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4437585001 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.251982914 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5269588388 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3081294684 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5221618044 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3226520344 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5750653902 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.3833943767 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.5822540388 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5414890567 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.6901603131 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.65136344 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.814288256 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.2479212607 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.4998884286 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.2970650759 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.5373052889 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2793086929 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.4720611769 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1318325912 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.3864569881 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3666373087 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5839902989 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.2824386471 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.5388064333 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3186845256 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5933794038 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.4349494723 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.6079740627 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.1773927146 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.3630036378 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.0949811313 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.3340540429 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1872829527 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.3848483899 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.2170056607 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.485021658 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3564149867 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.5972656918 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3029237977 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.5276781303 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.2876911945 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5482159609 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.2940448188 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.5448923741 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.2897223986 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5436301176 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.2571014471 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.4731076434 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.1827387853 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.4769620326 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.0613359658 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.2105103816 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.2802837747 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.4893845985 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.1179961209 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.3697436656 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2346057729 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.4744017815 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.1793887241 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4368728644 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2249815138 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.5077874682 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.2125650621 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.2904132435 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.3249125796 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5545635633 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2625209874 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.5042437741 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.1520275352 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.3905524229 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.0999041852 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.3246573528 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.2703816733 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5070503073 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.1229430143 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.3831192143 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.361635926 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.5409988692 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.3917357782 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5329271965 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.26251395 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5352694678 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3264296122 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5528035231 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3390879053 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5804013742 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.3506563803 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.5763378703 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2246840158 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5244113055 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3594079605 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.5726823578 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.1351642547 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.419979284 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.1783822717 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.3420045131 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.2074916818 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.4529002152 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.3320288719 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.6201778863 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2510503336 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4902642703 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2210031154 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.4920579152 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3219720359 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5542555367 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.2813682269 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5156714123 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2423449507 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5073629744 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.2856584071 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.4617854306 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2862677011 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5325160504 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3443407299 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.6019992774 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2049672714 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.4409541903 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.291136983 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4722890493 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.290841669 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5420316418 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.4456194272 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6359307779 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2592635841 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.5029886217 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0439234831 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1458942547 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2131332995 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4719991036 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.117107351 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2063865989 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2199013913 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.4962775874 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.1813558493 + }, + { + "model":"deepseek\/deepseek-r1-0528", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3079482476 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.311563429 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.5377881998 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2396682484 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4396755163 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.2166814512 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.4841980873 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.1410606918 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.4325882329 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.278130538 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.5385292979 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.2384630665 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.3608782934 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.3417210123 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.5899435952 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.2808352256 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.5279437548 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.3412745465 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5826925715 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.390058702 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.597901367 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.2090093301 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4788545798 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.2182033882 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.4418555529 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.2884896124 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4868568502 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2753136771 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4912165901 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2570929124 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4913361477 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.2251696435 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.4568625878 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3669654657 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.6010168651 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2158729847 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4281994918 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.2496588936 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4813242802 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1805770029 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.4382698967 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.2061377509 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.5025518062 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2617461401 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4657078066 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2478040527 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.5055046978 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.2299760176 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4382930134 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2988263355 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5680625724 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3895386095 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5693830083 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.3954134409 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.6048442845 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.4087786463 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.6570148202 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.3123005535 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.5830505467 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.335884194 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.5760217609 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.3897427607 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.6211463161 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.3989536756 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5939433432 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.4245142301 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.6390046108 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.4937713215 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6856946146 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3112735556 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5352584968 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3040377019 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.513213381 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5700014681 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.7211557733 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.6711231356 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.8279616884 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3344072959 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5751886204 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3905772718 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6166676981 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.3438075851 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5772164708 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.2647913841 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.489934723 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.4465199237 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.6601536062 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.3429301939 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.6176510545 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3411643102 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5823324237 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.549646027 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7334440232 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.020521917 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2363991566 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.038851639 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.2330289804 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.3431336081 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5478126679 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1775808906 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4530128509 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.2923469792 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.5018131258 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.2792533669 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.5455037681 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.4434404142 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6607832834 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.4308263411 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.6353494719 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.3988769415 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.6179037667 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1507190186 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.4178703457 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.3268473222 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5875784187 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3853964262 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.644268597 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3626330278 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5869542517 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.4368014195 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6964617832 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.2899610129 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.5189509889 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.2768774018 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.5137444144 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.3472094652 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.5708345321 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.2724432186 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.5503510798 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.3422169639 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5695643744 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3590717293 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5878176707 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.3331002174 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.579659503 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.336969824 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4913494739 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3700621486 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5837249923 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.3088767184 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5884562937 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.2509895727 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.5504416013 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.3061931512 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.5755019454 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3918191618 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.6170794637 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.1880645416 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3989811117 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.3364506705 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.568444139 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.3756915681 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.5684194735 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2805488398 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.5298229011 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.2739358937 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3591923755 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.1644396626 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.3700254848 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.1334761711 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.430142277 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3953125797 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.6309277281 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.3149005177 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.5121389124 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.3477763054 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5972164517 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.2678562502 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.5016256548 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2950679588 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.5434984641 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.2063059259 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.5248165256 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.3735487132 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5985929462 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2991127987 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.5530820193 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.3338185652 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.5787491818 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2806196555 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4516145469 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.4099406931 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.6343459464 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.4650961929 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.742377276 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.3081644584 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.567441399 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.2529515223 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.5121166935 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.4035620418 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.6298286173 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.2518010194 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.5019977224 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2807966919 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5304954689 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.4120530736 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.6593260342 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.2237313135 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.4999468628 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.2341852741 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.5553049856 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.1546333274 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.3730093916 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0699361494 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.4093787348 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.3421886958 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5848387431 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.2784394077 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.5108902329 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4372599799 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.658993109 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.4174871385 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5931595705 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2722413511 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5398004754 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3757453667 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.579529149 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3198419121 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.578067895 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.5056809967 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6966172136 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.3154573291 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5600439488 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.5650725553 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.7127688163 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2839962776 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5461994333 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.4589390255 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.6469214364 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.2696305636 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.5244991633 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.3319598047 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.5861214096 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.3972794455 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.6232130593 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.3415088181 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.5390152372 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.2864590726 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.5427330367 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.3306843079 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.4979151965 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.1795249187 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.439139386 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.2284701542 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.5463949389 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.284867651 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.5244275819 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.2202968782 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.5048544071 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2893867971 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5578776437 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4400648152 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.6115459213 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.32232697 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.5111738773 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.2383157401 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.5175978358 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.3617201239 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5926536872 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4685613196 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6911608485 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.4043048116 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5944297519 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.499303533 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.7212747243 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2819090872 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.5410426012 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2951438389 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5712604905 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.4243816819 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.6336752528 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.3644641049 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5789291672 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.2251503741 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4903696181 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.2873179741 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.5146227404 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.3047162219 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5499065244 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.4136384398 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.5513959132 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.2867986153 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.4858296113 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.101641187 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.2278398804 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2782856704 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5422402953 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.419062749 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.6455051222 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.3049575256 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5755673238 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.4056417811 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.6001236102 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0390495324 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.2184695701 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0636422012 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.296360163 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.31244285 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5630479496 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2911146353 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4826415387 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2813736334 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.5350839669 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.3532409319 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.6242374823 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.3436662566 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.59026429 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.447007323 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6624838094 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0835563722 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.3389944349 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.1150505644 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.3347031666 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.3135484165 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.5406963315 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1901478921 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.2245996516 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.2533217863 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.4979177365 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.1440335108 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.4965120865 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.1607554286 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.4105347932 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.1645681144 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.349083777 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2392191989 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4953232912 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.2147687469 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2691081013 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.3075560511 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5721434339 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.3628421643 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3921364269 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.3475884805 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.6151377801 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.3045492612 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.5663641807 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2499368982 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4866856816 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2032851597 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4298526595 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.1425831777 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.417812484 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0942003912 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.3936431694 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.2720072911 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.5061425801 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.1852281481 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.3131355766 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.2661119281 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.5602064313 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.194000916 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.4535351144 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2723646085 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.523730035 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.3878873306 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.592059186 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1616972069 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4328883781 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1751707508 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.4233167915 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.2181300738 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4481685644 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.215871503 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.454646328 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2489741176 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4653663899 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.1897550206 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.4113322824 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.2828158417 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5179193605 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1666719193 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4162476616 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.2101918607 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4594084738 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.171792145 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.4130816559 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.2000799381 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4988072587 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.3128559705 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4876970107 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2526226356 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.5007947756 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.2513374937 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4492954272 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2672489266 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.4952818431 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3639249804 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5538942616 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.4195422704 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.6085776274 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.3993771419 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.6357624414 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.260213991 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4864597898 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.2793994268 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.508602676 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.3077322035 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.5442587621 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.3445618242 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.56756333 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3382313883 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5705047774 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.5354923841 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.7125417889 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3210907235 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5292167329 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3443988404 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5424093748 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.4617498931 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.6321211549 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.5951204739 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7613397345 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3547349164 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5728186386 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3576086442 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6061019948 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2676796828 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5663114288 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.2591969049 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.4814104167 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.4277064952 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.6325003325 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.3269491361 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.612989238 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.2978444639 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5625976718 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5244850062 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7081676298 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0361796916 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.195120399 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0308475815 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1890051706 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.3150102324 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5340625085 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.2069349026 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4761478869 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.218966139 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4181042336 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.2395753169 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.5013466224 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.4286739426 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6359453866 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.4344801023 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.6474630132 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.3063272533 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.5583492368 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1757166109 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.4152865266 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.274174318 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5398050773 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.2927577916 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.56675535 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3126497326 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5733116043 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3882402101 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6624914478 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.1503374245 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.387578878 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.2586477386 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.4926307711 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.232232342 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4479000894 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.2119661542 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.5179791668 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.3116016155 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5537049588 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3440495149 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.6004337743 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.289402493 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5452343766 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.1879084772 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.3787664659 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3561823456 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5619277442 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2609272138 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5344454302 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.2053088231 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.491430616 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.4063809808 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.6167229896 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3195578223 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5643490342 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.2319063764 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.4461032467 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2485030856 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.4688750005 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.3577614115 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.5550425425 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2106519512 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.4804338475 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.2003821738 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.2850409306 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.1057085266 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2715159938 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0708970987 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.3583242702 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3007758183 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.5378616534 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2795823496 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.510712197 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.212326315 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.4808320621 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.2353530898 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.498918765 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2180528106 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.4350629264 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.1752962142 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.4941543502 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.3848912948 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.6007084641 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.3023908744 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.5415851472 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2906692433 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.5058194876 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2450137243 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4736891146 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3362256422 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5937301471 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.4506461939 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.7014575648 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2814491551 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.5513455988 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.2724659132 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.5135188138 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.3218775268 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5549355351 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.2676260775 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.5006126727 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2807256089 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5254117929 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.321808319 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.5984422632 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.1741946793 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.3946218629 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.1729000095 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.501423047 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.1059783758 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.3306681685 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.044447102 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.379164388 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.3044074075 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5411406602 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.2312884216 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.5063263205 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.3792889323 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6001893022 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.4267930078 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.583867208 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2910351794 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5387220968 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.352446244 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5847615168 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3275326122 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5672682921 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4390630519 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6588223005 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.3171625415 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5772460535 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.4778809926 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6619427768 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.266439807 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5101737799 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.4085478092 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.5658655698 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.15500158 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.3976950814 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.2871474268 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.5626056331 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.3431093451 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.5329383828 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.2838954554 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.48412 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.28322243 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.5207906875 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.2943621784 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.4749986301 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.1334599567 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3857630332 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.1122823827 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.4635739463 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.2156343628 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.4198074415 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.2207115321 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.5118672399 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2933759432 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5710698033 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4425485023 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.6215234533 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.2152161054 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.3971586695 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.2374945192 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.5272097328 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.3335095456 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5683382887 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4033731642 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6519271741 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.2763965367 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.520411275 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.4350912598 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.6853284539 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2415112532 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4752276392 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2730244696 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5683000198 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3528600199 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5850279702 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.3231474889 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5470305035 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.208524293 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4271785057 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.2278942993 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4700484002 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2681599618 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5133569475 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.3973895019 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.564303282 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.1768961884 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.348072496 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.1310924895 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.2594660098 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2806311806 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5431910468 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3916346072 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.6289997941 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.3007101794 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5519617104 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.319789332 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.540431455 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.025133561 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1190888288 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.018289241 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1529779827 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2859928961 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5295533045 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.3010091175 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.493353195 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2407351505 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.4734226532 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.3363563156 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.5891323556 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.3170290484 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5491010642 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.4032471641 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6394566771 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0638721925 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2417596357 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0586926041 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.2518105026 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2746262088 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.4924092277 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1648044562 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.2037009528 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.2251844915 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.4461128395 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.134895078 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.4836355083 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.1141869405 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.3128047258 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.1341626528 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.2926500144 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1826865099 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4272648905 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1499743312 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2347308661 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2557280993 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5212143675 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2610248692 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.314329989 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.2674818373 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.5139550602 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.2723879605 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.567169258 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.3519233265 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.5745897235 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2759791384 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4854942304 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.2615212462 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.4896634905 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.1667049515 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.4295949613 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.339375511 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.566407043 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.2692320655 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.3685144367 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.3872368514 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.6253206413 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.3385588073 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.5846751763 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.3462011916 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5813984303 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.4319399394 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.6269389132 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.2181205299 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4844955734 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.2033199109 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.4375696019 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.2639599801 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4789807253 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2907084686 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4882539682 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.3118761994 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.5439623542 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.243905252 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.4730608179 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.40510024 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.6210515689 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2510210672 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4814090379 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.3101513593 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.5253923906 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.216177525 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.4555999734 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.2142226733 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.5048792464 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.3216771298 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.5056511666 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.3246124272 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.5547058357 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.2300858071 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4391471287 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.3332105938 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5788748413 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3925309816 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5671456285 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.4667759574 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.6329355142 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.4086791428 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.6523845508 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.3593703137 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.6131084436 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.349617489 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.5888504157 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.4190817149 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.633614654 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.3332466044 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5272130276 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.4080538745 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.6278026445 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.4940498755 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6915113583 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3680077775 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5798463116 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.4003636095 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5747287276 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5780592594 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.727062887 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.725042796 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.868453404 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3228577771 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5691176688 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.4211069488 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6329026504 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.3659700454 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5807664259 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.2252471667 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.4480100347 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.447799796 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.6437494805 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.318387966 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.6173467767 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3683003934 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5961800274 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5899042948 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7506595836 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0858271085 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2495672773 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0320352537 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.2006317654 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.3793081536 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5865031052 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.2344717249 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4873543825 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.3157236901 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.5365403784 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.3221592053 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.565816945 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.4661333335 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6599650679 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.4319599559 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.6493733048 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.3345560794 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.5782385873 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1623642047 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.4427298342 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.3210417538 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5852315407 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.4603569586 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.6610825918 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3507436052 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5856872774 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.387557065 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6730969345 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.283991055 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.5165825783 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.297494689 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.5366364022 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.3679312463 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.5717815434 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.2293183432 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.5172904845 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.3498261827 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5707332142 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.35475083 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5942822113 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.3590987818 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5958999814 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.4151803591 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.5319028037 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3793672083 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.6054760312 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.3161702144 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5956895972 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.2948023962 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.5499737045 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.3612978689 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.6021186725 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3644204358 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5994539632 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.2065208646 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.4474063783 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.3051972526 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.5542686332 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.3567486129 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.5611431734 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2872143997 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.5525223441 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.3116476133 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3648802199 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.1399233592 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.315099285 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0802015694 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.3631437635 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.4128862434 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.6274466843 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.3688684574 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.5833102178 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.3890840766 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.6240476873 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.2256501556 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.4794729055 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.3701671266 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.5789314386 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.2339248832 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.5444701317 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.4065449181 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.6069224309 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.3084108149 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.5610104654 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2888720948 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.5411662197 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2820351359 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.5017455952 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.4137133794 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.6312868188 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.4812654706 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.7314221816 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.3696810103 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.5941720939 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.3374140159 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.5598126987 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.3690975587 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.591186642 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.2727284255 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4816401296 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.3099744217 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5540665201 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.358350435 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.6375438913 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.2769742108 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.5127880962 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.1953053994 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.5454095128 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.1552982789 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.4088650794 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0578542594 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.4227186624 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.3491547876 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.6003545703 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.307748028 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.5199829894 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4833653569 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6877252787 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.4959043786 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.631939007 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.345076722 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5982949848 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3888863333 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.6077722316 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.4185968559 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.6194298291 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.5066913819 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.7045563325 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.3510540475 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5985634799 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.5670740367 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.7258358589 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2835606416 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5525332546 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.5294387768 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.6814959444 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.315385923 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.5485214208 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.3039027455 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.5685019601 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.4019575944 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.6276858351 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.3830695907 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.5452929704 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.3256641934 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.5531574071 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.3465036043 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.5339014715 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.2148918029 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.4431856714 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.2048159746 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.5229910344 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.3102660748 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.5202647222 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.2456069778 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.503324615 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.3298581842 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5870517038 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4507987284 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.6306764686 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.3438400948 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.5431534783 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.2185629205 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.513335728 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.3332298772 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5774389783 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4778984127 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6958168144 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.4452506057 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.6299322033 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.4773237879 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.6983325706 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2765535661 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.5553462948 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.3584530222 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.6096517359 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.4838983303 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.6878651593 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.4225689448 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.6171822766 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.2905859261 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.5219303661 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.3215838806 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.5332721729 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.363389223 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5927603201 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.4280908922 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.5695430758 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.2870643832 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.5217258722 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.1683718664 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.2689944739 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.3532965173 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.6170908018 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.4401941591 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.6752054069 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.3183568029 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.569783479 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.4278428166 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.6040719448 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.037144113 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.089331464 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0447156552 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.2228994735 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.3194163699 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5758075077 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2609063103 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4351160146 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.3488574237 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.5833892626 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.3525318348 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.600901419 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.4227968054 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.6326522416 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.4693432911 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6659480306 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.1552091518 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.3984533183 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0934433089 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.3362523248 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.3241760602 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.5694459727 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1373684835 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1808455778 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.2594184267 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.4970898641 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.1342973002 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.4760810578 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.1670055121 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.3949060751 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.1271782927 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.2784136749 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2666023686 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.5200218275 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1881613886 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2877597368 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2632355471 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5527183044 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.3128970722 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3699956681 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.3295494586 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.557523684 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.3146714644 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.5811521396 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.342116281 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.559017125 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2612038772 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4610162591 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.2362598693 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.4567970323 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.1615485704 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.4248295507 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.2883756135 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.5452929372 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.2563045907 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.3587997566 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.3529391424 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.6061230642 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.3735935027 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.6118752881 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.3509446122 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5872861306 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.4369226272 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.6357392299 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.178647434 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.459184816 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1766325657 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.42829263 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.2689181562 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.5103302194 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2811045733 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4796679654 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.302725237 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.542445303 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.2074435657 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.4358785934 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3306584572 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5470737398 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1839015438 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.3995221223 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.2402619776 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4816842061 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.2017479595 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.4438028104 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.1964434077 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4658109118 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.3578761246 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.5250650323 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.3118354834 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.5301057957 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.2712094702 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4554148161 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2928560114 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5373877759 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.371713483 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5467648432 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.4167458111 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.6414773714 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.4574369641 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.6642298649 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.3171272191 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.5378911972 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.3576320675 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.5996552124 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.3763167038 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.6069984198 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.412011399 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5948875971 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3827187056 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.6092943987 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.5181328066 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6981190119 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3297475202 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5587828835 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3865296224 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5630460332 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5942868447 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.7298379077 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.7309888475 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.8534239972 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3497891701 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5889817614 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.395885417 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6273835234 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.3764428485 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5794911256 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.3019679958 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.5314471888 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3970330872 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.6224300541 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.3731416111 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.6421804886 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3737227872 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.6039484183 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5555743798 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7229519037 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0654195918 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2431272498 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0469027058 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.2599881115 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.344471287 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5591834446 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.180119873 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4654772276 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.2852268084 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4820918601 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.318588004 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.5675346049 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.4387215588 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6443095169 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.4255607348 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.6457270128 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.336133928 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.545638091 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1683321583 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.4261207547 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.3151646581 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5599039863 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.4642022823 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.6720003623 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3789722313 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5973074889 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.406320567 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6828299565 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.2779082008 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.5108078595 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.2835120188 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.5067796001 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.2679844764 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.5037933164 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.243508886 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.5329216971 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.3177725576 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5648818053 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3654943432 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5949572053 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.3423388267 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5884893314 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.3740472584 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4832664839 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3540174328 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5513315973 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.329885986 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5805485408 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.2553025069 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.5408614418 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.3062994849 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.58504635 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3700483899 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.6006134318 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.2315452529 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.4617416997 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2512885128 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.4934774392 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.3278617048 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.5102619479 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2465751079 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.515705028 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.2528779436 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3488788279 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0591613845 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2662007935 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0779434955 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.3095367271 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3908377774 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.6260985434 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.3130016025 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.5391710538 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.3471192 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5771683143 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.2207082106 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.4870892013 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2993063676 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.5474937127 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.2153101678 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.5379094165 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.3532448793 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5657281022 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.3046979511 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.5523287159 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.3055522766 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.5435968357 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.257460039 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4845716024 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3746934831 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.6046609636 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.4734156929 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.7284733826 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.3552781219 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.5977013775 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.3211140622 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.544805929 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.3774439938 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.599804205 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.2861323795 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.5180107937 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.312116976 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5463170004 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.3780530389 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.6232733213 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.2177968416 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.4415294523 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.1367315108 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.4585024296 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.1871006972 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.4365658925 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.106229994 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.4277182017 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.3740486194 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.6141131486 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.31231668 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.5222572922 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4182659606 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6696655487 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.4665320226 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.6280330147 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.3282584844 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5713765921 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3762753954 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5940500139 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3485890022 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.574915747 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4760104707 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6891420805 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.3285564053 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5835489949 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.5863602394 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.7345305045 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2893557086 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5514512546 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.4910352633 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.6636379715 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.2768738298 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.5136190092 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.2743310586 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.5596031593 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.3296224998 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.5499189472 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.2231786181 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.407169401 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.2632131459 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.4981476408 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.3150668549 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.466344362 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.1425864886 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3921687091 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.1876717865 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.4923376927 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.2921978364 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.5121729513 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.2437506181 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.511793128 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.3070769379 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5829431146 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4562210568 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.6349957477 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.2923338131 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.4917795718 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.2448808161 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.5213243396 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.340913979 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5878242881 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4174508433 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6558948574 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.397583037 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.6014699575 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.4540021563 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.7002830052 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2981018347 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.5573394656 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.3033361537 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5406646936 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.4025505277 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.6339036498 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.4166086163 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.6171953291 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.2859260679 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.5305344486 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.3454858711 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.5585923193 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.3196721957 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5597673276 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.4114706745 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.560767027 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.2476296934 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.5033069835 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.1179117378 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.2587205011 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.3291780472 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5900439285 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.4285247051 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.6508035663 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.3407035036 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.583433778 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.4167194618 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.6135073244 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0287200326 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1566177223 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0503465615 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.21805483 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.3212777323 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5735084601 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.3027958989 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4912965943 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2583582755 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.483302551 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.3579243963 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.6083657804 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.3471784526 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5719753053 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.4601231177 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6644848789 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0932068478 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.3792197219 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.1171143464 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.3384795969 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2968992777 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.5258850631 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1321430026 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.176594989 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.1979226992 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.4588070152 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.1181506898 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.4718021868 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.1110331374 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.3622261661 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.1764819134 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.3463753843 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2756047962 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.518253876 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.2356751392 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.3051882861 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2989639846 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5646599732 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2915310914 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3358004159 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.3429319501 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.5895603725 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.2713803282 + }, + { + "model":"google\/gemini-2.5-flash-preview-05-20", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.5773152323 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.0278093886 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.1209403877 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.0460469917 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.1583874959 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.0746358572 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.2039454163 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0106555853 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.1635891431 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.0987853648 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.2172965208 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0037326563 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.0273289802 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.0349474752 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.205929391 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.0109943205 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.1135056868 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.0231513455 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.1669816885 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.0192052173 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.1199941852 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.0482644911 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.1570610957 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.0671140896 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.0333540125 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.1654807425 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.0300458941 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.1417391491 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.0153668157 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.1119995149 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0988733729 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.2096173766 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.0696643378 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.1931858455 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.0309816185 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.1018697927 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.0634083235 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.1819427877 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.0728528728 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.2068099712 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.0726648889 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.2430791182 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.0528414924 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.1724803068 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.1903946317 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.3145924631 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.0310651444 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.0425897525 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.1329517484 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.1071842556 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.2292182808 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.1295041316 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.2647572228 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.0551171959 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.2019792449 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.1181725504 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.3417239653 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0030057917 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.050016858 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.1106488773 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.2661126449 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.0566112691 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.2161355093 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.1071586446 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.2867516145 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.1380160311 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.3472666619 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.1228102479 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.257059719 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.0709906394 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.1615768924 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.3271580119 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.4059591673 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.4705724484 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.5810510479 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.0612440394 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.214820597 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.0718408174 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.2974455623 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.1093307519 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.2212819207 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.0461058798 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.1370841628 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.1005924157 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.202708484 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.0160833262 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.1960110619 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.1269813968 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.3065913664 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.1789987295 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.3463028707 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.014745965 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.0749091363 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.0895914252 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.097971755 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.1777195033 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.0318870555 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.1529629731 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.0369448389 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.1480560277 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.0919802251 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.2629251679 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.2538230452 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.3759994265 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.0835774684 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.1904298158 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.0800273183 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.2260677118 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.0220446366 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.0997285023 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.0883989834 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.206785454 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.0790692679 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.28304649 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.0773479102 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.2587381281 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.0433423647 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.2817069358 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.0612163002 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.2381342912 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.0426402139 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.1696737174 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.0970247032 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.2111718332 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.0050070462 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.1683969558 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.139001615 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.2668336456 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.0475935646 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.2602541027 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.0609909305 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.1860226608 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.0692256682 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.1449932716 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.0495085803 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.1459303026 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.0098682093 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.1292642853 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.0827091376 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.2337306985 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.0492400989 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.155912411 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.0860125484 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.1623830923 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.0024514101 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.0781695805 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.0937784828 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.2195953032 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.0577688436 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.1510063998 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.0680252346 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.2091636742 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.0555477009 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.0549298013 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0036630043 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.099240382 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0532977337 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.2153600503 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.1425685645 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.3016796517 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.0118929014 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.0840825564 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.115229855 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.2180450998 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.0163179059 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.0417840087 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.0410364581 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.2193286405 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.0422799242 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.1425526516 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.0630918824 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.1710971727 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.0386225926 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.1445595523 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.1084731704 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.2498733805 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.0399406962 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.033427329 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.1616696801 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.115786224 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.3018549986 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2294643956 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.3457333311 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1065767565 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.2047469752 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.0951128399 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.2178534884 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.0398161454 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.1412294262 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.0563796721 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.1918127836 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.0887408505 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.3444852597 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.0322569074 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.1681655692 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0133097605 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.1890356187 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0380467697 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.11665963 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0196821089 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.1887330103 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.0987048471 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.2474195062 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.0246921682 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.1089265139 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.2220426626 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.3598952341 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.1611882376 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.2396561128 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.0904332342 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.2068730334 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.046065351 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.1925827805 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.1079576302 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.2645017017 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.0569295003 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.2615431845 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.131593328 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.3060223321 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.0757294413 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.2150897212 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.0926690761 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.2397253952 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.1044259789 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.236302624 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.0153852885 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.1605190155 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.0600552316 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.2182309051 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.120327349 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.2042820289 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.0309396387 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.1043645846 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.0861987344 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.2079338406 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.0196434254 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.0610643505 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0320247445 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.2176774161 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.0700005142 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.1952413901 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.0252575003 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.157057904 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.0629444831 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.1833979697 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.0868186974 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.2586575848 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.1093378877 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.2502315423 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.0782352762 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.2378174872 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.0338179306 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.2284098709 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.1179976804 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.2633320797 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.0494945427 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.2411403917 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.1282740208 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.2521886667 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.0748708455 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.2420611826 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.1073230839 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.1798254279 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.0317538654 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.2038003362 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.1951561832 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.3697480899 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.1899598166 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.2894416622 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.0653258846 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.2205970586 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.0222271283 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.120000505 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.1262768628 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.2570885899 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.0575688551 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.1582234491 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.062613791 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0059519046 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0274291267 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.0337787053 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.1824544035 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.1405643754 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.281387297 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.1091041441 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.2184696361 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.1508474535 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.234056096 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0058005929 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.0841095708 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1328221884 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.1386027419 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.3084595255 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.0167447692 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.0960347815 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.0342337572 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.1153353221 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.0694684605 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.2369528571 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.1615259525 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.2808117936 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.1251511875 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.3058766946 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0065958006 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.0642484091 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0043862302 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.1616631945 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.0666328001 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.2282939681 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0063550665 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.0402314549 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.0731036446 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.1810894045 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0117190064 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.1631103727 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.058648798 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.162917811 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0647492243 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.1522863767 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1133445002 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.2630654346 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.0177899901 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.0452074918 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.0949407188 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.2042376654 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.0169223477 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.0689235431 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.2000811037 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.0413489342 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.1904482997 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2073802913 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4889223975 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.0840656979 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3453561943 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.120094546 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.3259782194 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0974181135 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.3477814679 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.2393172056 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.4971254293 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.2089212841 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.3406916002 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.2712045148 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.5477096036 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.178052271 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.468064885 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2747843596 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5519960681 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.2863967069 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5318173199 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1096694862 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4291604898 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1630720543 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3952400339 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1892846534 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4212342522 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.1938470016 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4527968539 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2094379574 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4509809217 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.1931386564 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.4233010233 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.2957522582 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5232039352 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2308361669 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4087255612 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.200456445 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4226152307 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1414132922 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.4170843853 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.18522743 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4467570037 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2590661095 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4657468506 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2663307677 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.519985227 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1913577407 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4064669591 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.271237739 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5173954387 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3067537945 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5194482945 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.3694979709 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.59081536 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.374702944 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.6019503341 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.2792699678 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.5157552806 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.2334415639 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.5128705295 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.3536861453 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.6024608455 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.4031829559 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.6234553711 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3189602129 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5548503533 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.5229096392 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.7023434262 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3137252517 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5147981205 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3302929673 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.505425141 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.3889146477 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.628092835 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.4660772497 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7280386297 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3593767686 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5668073679 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3662275621 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6102640711 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.286051969 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5373856549 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1816947237 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.3981159206 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3579818144 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5889481625 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.3403832088 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.590264879 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3180384008 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5571267732 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5778354146 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7490356238 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0380719948 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2066039108 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0259757351 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.147148937 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.34811918 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5482709715 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1618983325 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4411905252 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1925315551 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4032389241 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.1992720083 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4905441802 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3722751955 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6207213131 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3378499277 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.554090013 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2879989689 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.5083598943 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1719225434 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3992950999 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.3234067809 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5706707095 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3187264685 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.5856828402 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3583744222 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5732194975 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3364664006 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6438910651 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.225000401 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.4567066441 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1941055199 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.4504811493 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.1944477164 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4517028309 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.2035517344 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.489419705 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.3074361781 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5178180754 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3505959215 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5955060476 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.2581140706 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5395853617 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.3298839393 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4471547552 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3177915441 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5387853038 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2549228547 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5322440265 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.1983700044 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4843458319 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.2920207746 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.5345155349 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3702042307 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5776853975 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.1498433716 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3652702605 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2858443353 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.5499221943 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.2481102245 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4829685786 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2305492704 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.4826740501 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.1746024172 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3073554703 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0913600379 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.3305636235 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0269728382 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.3155017027 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3751831337 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.6085851316 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.259988405 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.5046714005 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.306099972 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5370842801 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.1736022871 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.4305653856 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2826629018 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.5215979873 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.238462643 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.5334745774 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.3161992509 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5479755911 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2133071404 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4660281027 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2370074805 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.4804215458 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2399769139 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4726429935 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3104483533 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5705763492 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.4229626959 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6856510383 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2227645269 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4888582617 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1869632744 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.4322398057 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.3115387303 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5342290246 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.22081567 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4878836055 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.3125704924 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5397676594 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.3586968371 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.6075205554 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.1901221224 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.438728736 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.1330024304 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.4711022084 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0258426139 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2237241232 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0460531144 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.3418147419 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.3714452662 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5977153904 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.2234825764 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.4562477173 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4180718844 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6426219278 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.3938693136 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5573992167 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2456102401 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5190609119 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.4265619216 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.6320824157 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3537745123 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5904429929 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4588664196 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6844540285 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.3139442337 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5741447282 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.5016049999 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6788048008 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2449777422 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5268764903 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3789708434 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.5790333031 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1839360587 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.448997409 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.1891835724 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.508623725 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.3352727297 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.5583215205 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.2009000601 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.4004383195 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.2297304995 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.5040607132 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.2136543311 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.3916393466 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.1221415503 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3516954503 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.108688779 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.4515663403 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.2308889646 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.4618048204 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1667302795 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.4717296026 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2351861569 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5329036218 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4168384094 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.6032787874 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.2291561983 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.4673987803 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.2036733766 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.5047620958 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.3500384253 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5797456052 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4268868445 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.664863412 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.3005035588 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5210660172 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.3401968092 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.6217197146 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2662307086 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.5053585639 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.3044345778 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5714036731 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3330093484 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5694168709 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.257812168 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5167002436 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.2176170344 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4496406258 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.2605536967 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4816066849 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2992360169 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5585599708 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.4269079012 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.5719718715 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.2042995208 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.416626147 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0833250166 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.1982489294 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2832304201 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5467240003 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3273464288 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5827048506 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2813742416 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5413704266 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.4063054094 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.6020718231 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0495917134 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1711087397 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0358872001 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.2761667256 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.322448107 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5887654616 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2148139783 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4226865444 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2829644119 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.5194956482 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2911955464 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.5560139888 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2745000434 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5206422805 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.4261790941 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6358462464 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0696458062 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2461140434 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0728989985 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.2267265908 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2072386748 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.4628288648 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1471425714 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1971299212 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.253783308 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.4487387303 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0662544821 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.3784904721 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0887390501 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.3201148841 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.1178050815 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.307433063 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2253512269 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4949150094 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1897306863 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2561574259 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2201641871 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5051068628 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2508351517 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3110461024 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.252616884 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.4822778382 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.1940901676 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.4661416094 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2041309024 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4630820951 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1453469275 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3874336138 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.1059711376 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.300568481 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0110669593 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.2141540563 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.1906134629 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.4467868389 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.2001643223 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.3225170104 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.1876459632 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.4830875841 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.1830944017 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.4175337587 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.260683336 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5383651277 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.2962406565 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5190026627 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1438491224 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.418499848 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1044262978 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3577242047 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1675595946 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4187188467 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.1545869288 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4031218248 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.1892328534 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4434206925 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.1070430926 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.3318636339 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3180630074 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5401606876 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1993490206 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4215901923 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.1604267099 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4139767864 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1651025864 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.3978212407 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.19213953 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4512512424 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2406657525 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4536513075 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2519150677 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4966963131 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.2057435019 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4016427491 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2183929994 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.4877941086 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.2700916391 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5150577414 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.2900668497 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.5379961095 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.3193377157 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.5978978692 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.2457083208 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4937183307 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.1424911854 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.3546559531 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.2481120403 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.5339550423 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.3131426524 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5548197404 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3440655166 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.563902418 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.4305522274 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6477508732 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.2080428665 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.4376921278 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3106300811 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.4971105137 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.4113463435 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.6260248317 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.5310035709 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7595845064 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3031284355 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5241309352 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3289699508 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.5811203167 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2483616515 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5338391625 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1651229998 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.3923963113 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3057177881 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5523945263 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.2711892461 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.5802332073 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3349110908 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.564806297 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.4574014191 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.6626552528 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0488154154 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1944904286 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0115014356 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1082073343 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.2954497906 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5086877895 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1582270271 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4201411039 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1697291765 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4073157654 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.139672818 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4450194819 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3184042229 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.5712698408 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3659029431 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.5796195236 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2791185419 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.5226615992 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.145820804 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3820953887 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2313008892 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.4915348458 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.2765024802 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.5261755337 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.2301748885 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.4682741896 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3346592082 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6514874668 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.154261694 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.3957095627 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1177946719 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.341868335 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.2239397579 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4512212104 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.135748348 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4408716957 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.2724260509 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5200202435 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.2753225284 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5457466615 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.2664966821 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5386982677 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.2651365589 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.409095006 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.2326358655 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.4815897231 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2187928356 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.4896578943 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.1666068635 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4554883841 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.1547742726 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4534139462 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.2647824193 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5269086196 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.1635334444 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3431273828 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.247746183 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.506339637 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.1775009719 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4300321597 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2402657185 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.497198112 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.3100527074 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3696197774 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0872330227 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.3059813913 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0010116202 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.1893341465 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3447519877 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.578789784 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2508560655 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.4987822313 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.2732982319 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5233285219 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.137657899 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.3935929024 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2082275626 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.4639776287 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.1350252624 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.4834543859 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.2600500491 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5029669853 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2091322046 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4711774201 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2256246926 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.4703189943 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2254492518 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.447826525 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.2986303081 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5546917725 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.3680194341 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6778287705 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.1979480779 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4791457508 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1536786708 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.4315811907 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.2955515679 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5399574649 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.2350766648 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4890671168 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2583853642 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5143387984 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.3585971813 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.6255063069 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.1562574059 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.378833839 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.1000795039 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.447037349 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0981161875 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.3370208163 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.040931235 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.3615428475 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.2626677598 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.4970567085 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.1807466012 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.4219189716 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.3706063992 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6167676482 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.4234596823 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5629443923 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2754265608 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5207065369 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3700040895 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5924241261 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.2971403532 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5321068893 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4364286549 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6509885745 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.27702997 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5437386483 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.4580925611 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6514836722 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2300270544 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.4839384065 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.4236492288 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.6116207052 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1602143293 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.3793757948 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.1370228414 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.4797772284 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.2571204202 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.4946608155 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.0869374651 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.3119061498 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.1981443603 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.4536105905 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.2278086127 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.4013315084 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0939343156 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3129229613 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.074740365 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.4045773842 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.2273071628 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.4497946959 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1824497409 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.4972329945 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2541965029 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5234491687 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.3308712415 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.5512495988 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.1522391036 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.3508292995 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.1514782919 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.4909144205 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.2959760233 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5398896148 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4357891553 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6529723913 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.2501435914 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5088299265 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.262372343 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.5806899403 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2450100573 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4918691312 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2434733519 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5120095348 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3568851036 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5825326367 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.3112091725 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5431414206 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.1741933649 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4272342177 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.1811584685 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4001890626 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2544201673 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5081271409 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.2942923294 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.4479604827 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0881111208 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.3173214379 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0384668791 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.1259439982 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2563119866 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5291012922 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3009595898 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5854044281 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2567288533 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5177571061 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3201007033 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5323037228 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0115980217 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.115883071 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0129780747 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1450749981 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2402951661 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5033005385 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2302239803 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4066956434 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.203750264 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.4979829233 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2162945849 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.4941278712 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2537752957 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5073147534 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3583753747 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6253917282 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.1081430594 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2665454299 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0142970887 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.1489810124 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.1700904158 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.421111634 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1213993524 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1655788185 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.1531171972 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.3828830786 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0483942569 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.3116951706 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0816098185 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2781732759 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.041496472 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.202397124 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1783312983 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4423885999 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1632112014 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2297357227 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.249810194 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5151255506 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.1854861198 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.2463326959 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1729786376 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.4189697233 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.0866404913 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.3943277627 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2177971147 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4738076987 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1414064724 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3965739567 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.076595229 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.2493366365 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0440715947 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.2820233612 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.1913062339 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.4296053228 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.13443556 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.2528930204 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.24265587 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.4918380331 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.2104382871 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.456050442 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2891206499 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5438550217 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.3184721364 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5483731849 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1664804364 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4585261833 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1299183594 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3752977557 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1618648119 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4104839109 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2266738862 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4315390742 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2602059805 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4987515978 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0907943093 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.348768221 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3277667824 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5267403611 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2123273366 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.408906638 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.1880331404 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4234748209 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1517877566 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.423956163 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.148851004 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4514291775 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.3105472783 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.498684126 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2430984589 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4969060141 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1699224465 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.3964402252 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2907230812 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5148223626 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3473636391 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5442574441 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.3650597419 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.5512750223 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.293824845 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.5724817779 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.1983726871 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4779908235 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0792877335 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.3908004248 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.2863884915 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.5641108436 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.352498756 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5860513143 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3577876868 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5943423055 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.5344280565 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.7084649844 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.2914236052 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5147962724 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3761179017 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5590147212 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.452427177 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.6525566656 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.5467976399 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7780833183 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3554331718 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5997743406 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3847830842 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6191109047 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2579194729 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5351839762 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1571676635 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.4046770996 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3771043132 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5835797455 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.3564426025 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.6107274367 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.2846092378 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5655970541 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5192984544 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7020040834 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0220051815 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1861453784 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0227307294 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1850492522 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.2796934014 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5155626456 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1979202011 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4528880823 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1595296755 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.3859356797 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.171830216 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4608354018 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3520691191 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6035990708 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3987037224 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.6195037668 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2709410734 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.4976144005 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1150407607 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3709160058 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2903150375 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5392715859 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3460432788 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.6009670508 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3377417704 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5674360496 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3534620252 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6680177029 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.1600009223 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.3857586031 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1602266912 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.4091024664 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.1546473042 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.3985794204 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.1752645287 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4668449261 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.3356485456 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5684527887 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3627134123 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.6050822949 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.2481856237 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5180749152 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.242508046 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4046420215 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3019627022 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5133980923 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2316517545 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5189963647 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.2187004813 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4910590831 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.2108939118 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4375825873 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3274744668 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5605813039 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.0800539722 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3336188156 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2692189197 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.5290912174 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.2869741566 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.5072256514 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2172591082 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.478962626 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.2169046229 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3151387909 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0905061152 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.321707617 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0361920973 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.222315171 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3100950481 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.558054933 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2213152575 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.4821662369 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.3126340837 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5601639768 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.1875297747 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.4394137195 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2502298144 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.5206889602 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.1301910408 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.4488625613 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.2809005667 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5466717628 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2287455417 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4915489263 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.3395095603 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.5877742809 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2222923122 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4572688692 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3794800258 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.6256125923 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.3593747877 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.664135376 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.251920694 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4662583176 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1647980206 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.4166796691 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.3022338928 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5587522289 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.2252421952 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4768786292 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2793746981 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5246312011 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.3496466203 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.6032151622 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.119086784 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.3898511388 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0923649849 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.4837931302 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0417850648 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2509675066 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0312813941 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.2886309955 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.2613495089 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5009335042 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.1648455996 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.3943041737 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4164890636 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6375470445 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.4166823661 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.575314128 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2913506513 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5431985912 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3723742743 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5891983505 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.340245547 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5681284927 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4702737577 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6903236014 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.272965046 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5527916308 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.5195197328 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6892729705 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2862936285 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5264436928 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.4800957551 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.6618495803 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1701995093 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.4262662427 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.1513262342 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.4732082637 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.2365858071 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.4722212406 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.2251623508 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.4159341653 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.226689844 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.4706510499 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.2258552473 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.4191499082 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0756830418 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3184767575 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.0495523985 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.3971096934 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.1915993132 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.4208812642 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1724511246 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.4741419887 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.245439349 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.536270172 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.3929818488 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.5787667028 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.1784974236 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.4520828188 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.1435021957 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.4868234587 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.3258404036 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5652149653 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4264864443 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6543542662 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.268709657 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5306834056 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.3395981599 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.6130756934 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2563448403 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.5007966916 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2405135195 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5564984925 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.2787922254 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5420797212 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.259866454 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.48543634 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.2018690154 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4335923466 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.0972794658 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.327182503 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2400131449 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.4851690277 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.383380628 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.5430720239 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0736674948 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.2974206944 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0241026131 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.1246172628 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2757340333 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5244536559 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3185578758 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5765088485 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2918547905 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5631912653 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3283437369 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5565790802 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0359452883 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1779043042 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0305779168 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1838354035 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2595582459 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5043992681 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2142625601 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.429749938 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2595944841 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.5081810113 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2601189518 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.5225655991 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2279880384 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.4835933272 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3478085621 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.5968604742 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.065945115 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2358663461 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0540055322 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.2390749172 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.246042863 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.4917114856 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1017188886 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1707828137 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.167004472 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.400944552 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.066271851 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.3937495329 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0472060067 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2924612708 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0525309984 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.2304098638 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2124709579 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4811646042 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1392232 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2205120991 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.1900086584 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.4895930442 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2395565562 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3237759485 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1607803472 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.4377738064 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.1538390263 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.4751516021 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.0750313913 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.2689370364 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1097950919 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.2459305972 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.04291871 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.1992226055 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0012692029 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.1055962738 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.0135029462 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.1510010912 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0033288372 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.0389705109 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.0592251547 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.2921276604 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.0366276845 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.2393327958 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.0837265107 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.3012065838 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.1120670716 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.2771296913 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.0213908698 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.2206299292 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.0285726559 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.2326683564 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.0290259599 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.2238098591 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.0597935462 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.2388670431 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.0254218054 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.1827114877 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0012328171 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.1200208328 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.0888105743 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.2644372522 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.0668939667 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.2520473985 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.0148972561 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.2336350172 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.0047574121 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.1922357185 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.0366814427 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.2731193887 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.0173677773 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.2136838993 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.0581882104 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.2702416532 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.0562052656 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.2181774858 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.021858254 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.2327499821 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.0253088472 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.1918662187 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.1238388635 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.3442960257 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.0243559813 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.2777667131 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.0155834504 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.1833348617 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.1279598659 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.1272159331 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.3713000806 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.1249879163 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.332725923 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.1784955678 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.4008799371 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.1782663616 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.4070825897 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.0708485888 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.2987254392 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.0335582401 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.2213744022 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.2797104835 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.4601471921 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.3392404298 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.5518674496 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.1682956348 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.3705606944 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.1595479626 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.4040956812 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.0333586544 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.2582740293 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.0187498765 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.2265924477 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.1122756663 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.3654994366 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.0565617503 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.2914640343 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.1362099506 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.4039646029 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.2151785904 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.4309035319 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0308954874 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1818653 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0168607588 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1570666495 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.0426900866 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.2179546047 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.0232938459 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.2007105106 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.0254280801 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.1890793851 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.0144953008 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.1884647114 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.1658307051 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.3676480008 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.1711676323 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.360371738 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.0316097931 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.2354084259 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.0324437189 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.2310907497 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.1200885566 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.3203716958 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.1112414449 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.3175953836 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.1399603895 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.3604113675 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.1312450274 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.3988827234 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.0365286922 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.1990661561 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.0199391634 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.1497878674 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.0448341108 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.252793155 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.0162978516 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.2157203276 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.0992729275 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.3331935567 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.1507170285 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.4062498972 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.1222242366 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.3415186168 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.1607198845 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.2706371796 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.0550016522 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.2468917982 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.017690474 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.2536001746 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.0436064509 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.2149063632 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.0078784523 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.1640159488 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.0075610365 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.1887566902 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.0847212314 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.0397152583 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.2037873099 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.0137546968 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.1710566423 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.0564413481 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.3212656259 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.0674768387 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.1657544717 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.037013395 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2338208281 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0011308834 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.1078312824 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.068704384 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.2935036324 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.0888104824 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.2740386167 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.039812774 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.2668100649 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.0365460997 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.2177619304 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.0221745742 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.1989640913 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.016161822 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.1752502983 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.0532822129 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.2301007371 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.022639121 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.175884413 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.0411296617 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.2442292695 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.0482775033 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.2211003771 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.1375979502 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.3518293272 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.1462646527 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.3886405702 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.2238699363 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.1606469353 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.0498052059 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.2651327526 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.0286452462 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.2023398596 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.122262497 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.3515428019 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.1527676878 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.4249238432 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.0279631361 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.2321541854 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0195222834 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.1762015362 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0127402107 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.1651498064 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0088808864 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.1702476721 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.0366762006 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.1697470704 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.0190635247 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.1343627089 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.2292007848 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.3716655897 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.2126702079 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.3248815955 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.1085949014 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.3346783911 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.1676106101 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.3907504991 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.1013445398 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.3063125264 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.2231857524 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.4401829864 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.0955350175 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.3286351702 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.1871630014 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.3655570607 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.1005466956 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.3356518748 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.1363185356 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.3769111636 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.0189997083 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.1919557381 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.0165320564 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.1417103032 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.0441421075 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.1739314177 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.0182129294 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.119134604 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.0302406554 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.1787247799 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.0014746217 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.0931903615 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0192199252 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.1851933727 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.016306816 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.1413916659 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.0299103049 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.1986832691 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.0138432 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.1610036541 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.1315135307 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.3968249514 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.1220351802 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.3505317727 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.0605189037 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.2644052383 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.0323301168 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.2153999563 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.1638179638 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.3812064776 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.2333909009 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.4689649165 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.0510060878 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.2132741272 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.0089146903 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.2314109768 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.0303451125 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.1748071119 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.0076177075 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.1986647775 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.1096331511 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.2888090685 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.1206114883 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.2597106436 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.0268228091 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.1751009974 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.0015866917 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.1423262509 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.0382115226 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.2562543067 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.0125933293 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.1659603426 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0161407336 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.1568869137 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0241402636 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.0907273605 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.2666411269 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.0495223383 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.276468397 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.1408426214 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.3768513401 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.1029189854 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.3606378352 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.023064469 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.0922502173 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1015661134 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.0891185343 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.281793335 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.0799576366 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.2661903898 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.0287030985 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.2124751899 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.0040250398 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.1706379305 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.1389065496 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.3708687542 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.1661316612 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.354399593 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0242583204 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.1929988599 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.012814538 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.1551759179 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.0973024735 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.3076531166 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0161682999 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.0635837055 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.0478834907 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.208762819 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0095341532 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.150635966 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0080365175 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.1647602539 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.0909640555 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1043191943 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.3414129274 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.0651436117 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.1002582276 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.1133138775 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.3754190494 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.1672636279 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.232325354 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.0206894768 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.1952546166 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.0113901513 + }, + { + "model":"gryphe\/mythomax-l2-13b", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.1302687289 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2152631134 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4621033585 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1438913245 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3637806215 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.0488692805 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.2406135335 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0214880279 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.2270659336 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.1203676158 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.3241911739 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0165994228 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.1058904177 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.2332719546 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.4924788322 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.1544598614 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.403814105 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2609114367 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5167379854 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.1932802581 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.4648835751 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1270864308 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.3882289796 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1366193757 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3691581345 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1966421011 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4161867731 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.1531147508 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.3635575685 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.152657571 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4132859119 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0663682991 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.3007728685 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.2739426076 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5129388019 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1227671497 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.3306179967 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.130005692 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.3815764307 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.136654027 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.3809883299 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.092815209 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4056492611 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2013843536 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.417738842 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2451140745 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4883780153 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1334730215 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.363000921 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.1938367121 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.4674774016 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.2073541352 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.4438396219 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.260902514 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.4589913242 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.2033313823 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.4899690932 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.1866723671 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.3936568086 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0494661624 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.320713519 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.2435247423 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.501836375 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.1956638929 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.4870538255 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.2685056004 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.506818165 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.3801657831 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6056477234 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.2197756902 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.4571715629 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.2911113336 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.4641387139 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.2216031518 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.4429472312 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.3322887566 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.5824514758 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.1640783778 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.434749516 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3126220052 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6038883227 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2147534918 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.4874495537 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.094833194 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.3292486732 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3074477197 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5168064726 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.2380541489 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.552589393 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.2261588318 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.4944996319 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.4626001556 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.6614963779 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0704357087 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.214215478 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0113955269 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1874434226 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.2250377214 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.4688956519 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1515937263 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4251249067 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.0957125553 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.3135046613 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.1387309388 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.383923158 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3316295853 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.5594083443 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3598049012 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.5828568956 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.1166136282 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.3855078109 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.0887957809 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3187695245 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2237665442 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.4896395702 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.2614626337 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.5280652466 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.2236143729 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.4912948296 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.2910526755 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6005590773 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.0845382562 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.3303135434 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1267144204 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.3667670284 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.1301757317 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.3568142061 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.1161068297 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4147684511 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.2150043089 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.4693148389 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.2998342329 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5545377546 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.2131020144 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.4845704057 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.1446650781 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.2292145443 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.1840709267 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.4042090141 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.1902389614 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.4796942089 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.1500855 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4100527329 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.1136442629 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4236240472 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.1899800627 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.4618900518 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.087831891 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.265907742 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.1797031918 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.446466319 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.1846339038 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4220658756 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.1932392069 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.4204852284 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.0476115004 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.0790735292 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0505101039 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2502174391 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0135029462 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.1682326163 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.2778994313 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.534066621 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.1661930328 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.4001562798 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.212877318 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.4587224182 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.0873487304 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.3409755146 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.1013985932 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.3022487832 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.0611289601 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.3842495071 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.2670990652 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5220692033 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.1981851908 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4555314776 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2152417217 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.4578207034 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.1654073391 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.3941079443 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.2763114217 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5353874356 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.3315044625 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6241092077 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2083780287 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4466015977 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.0879797246 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.3441521948 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.2353570133 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.4846450712 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.1632876087 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4158370821 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2136151785 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.4670269701 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.2202915792 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.5233013945 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.0757269477 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.2848998148 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0329429353 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.193397393 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0206783974 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2005424268 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0171071488 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.239253642 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.1677012885 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.4316686173 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.1202133569 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.3816566526 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.1891048622 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.4238091524 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.2086330089 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.364326938 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.1998083747 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.4667760664 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3336132898 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5541703282 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.2256776552 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.4793769886 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.3320822339 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6132478102 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.1978207058 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.4682392821 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.409911871 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6078072484 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.1730354472 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.454951133 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3073459183 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.554890569 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.0841096684 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.2671346741 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.0409000825 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.3185422263 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.1343511225 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.385804118 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.0662090824 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.3030628402 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.1430431721 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.3858131555 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.1602151366 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.357355981 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0399118136 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.2285191544 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.0269601697 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.3006594703 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.0705893599 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.26834967 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.0988956652 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.3896116232 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2014976842 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.470196154 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.2922893702 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.504298223 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.1538893384 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.4005055487 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.123816759 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.4480197519 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.2739803344 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5286596224 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.3468145126 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6078627072 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.1798653655 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.4290347271 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.1709237193 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.522080463 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.1405088565 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4088204523 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2360333676 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5038093602 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.2507091988 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5067409185 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.2998213366 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5112516267 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.1029119511 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.37770665 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.1507872741 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.3945276116 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2022308722 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.4620737135 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.2592698778 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.4253112122 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.052152068 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.2578037483 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0237309602 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0808540368 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2231619401 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.4653230255 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.2701457179 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5043061571 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2437336637 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5042825637 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3231504544 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5440009645 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0461126383 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1577698173 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0008007826 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1426831674 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.194871957 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.4838690709 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.1908512613 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.3855814375 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.177513842 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.386230097 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2544813414 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.4948262917 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2003733128 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.4613442635 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3326058501 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.5496097026 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0685259305 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.234718691 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0319335459 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.1970529604 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.1538409962 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.4398974306 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0373503953 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.074080246 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.0707946688 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.2881582575 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0204932467 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.2690069759 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0339322053 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2166922882 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0169319822 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.1617793532 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.174955946 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4554476081 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1400846872 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.1809201358 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.1869648376 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.4664675781 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.1696786467 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.2325846099 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.0515154857 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.2819357103 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.0804926199 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.3473550746 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2561356588 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.49648558 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2071032166 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4109686249 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.1091965593 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.3173514683 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0490503072 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.2649288206 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.1375609672 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.3710873948 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0526682247 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.1185738392 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.2624553878 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.5118695802 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.2175864677 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.4641969296 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2766513185 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5528193738 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.3371708551 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5607841978 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1412140088 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4082636767 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1613157357 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3896124669 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.2374604323 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4585263555 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2300327193 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.43482663 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.220118305 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4767360664 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0623766799 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.2986098722 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3261928856 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5339015736 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2330787096 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4427484336 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.1767618659 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4088166263 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1381246624 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.3730280956 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.161760748 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.450732576 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2170520787 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4098923096 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2731033294 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.5159041397 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.2075901182 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4086862509 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2623045124 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.512895511 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3328087961 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5013967236 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.36364203 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.5712362729 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.2701190878 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.551918321 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.1903904403 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4687496067 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0520773173 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.3368230674 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.3416129059 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.5845038999 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.2726323508 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5283879512 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3059254014 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5403551155 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.4588037752 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6692431614 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.268843518 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.493449014 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3403168702 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5086292148 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5486108614 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.6873139374 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.691450825 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.8407064328 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3021494986 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5604145602 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3865320679 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6126903448 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.3383579693 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5641679075 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.2069613925 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.4288746449 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3771163962 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5827777548 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.3225619014 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.5830090459 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.2924853239 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5462367408 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.4963618411 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.682573515 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0727409119 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1973579541 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0147511412 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1172295571 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.3220032872 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.537784261 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.2206953431 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4990640113 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1527043255 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4074071592 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.1567942198 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4125213011 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3914590212 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6128431348 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.4189427376 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.6262550579 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2338808528 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.4544102907 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1243598882 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.4051657211 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2678903597 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.520149627 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3361911519 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.5583527487 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.290274553 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5143960108 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3789023659 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6751523776 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.1640789976 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.4462743519 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1964520184 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.3861299089 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.1899251487 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.428775702 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.1861284915 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4568269097 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.296179579 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5259369403 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3187240753 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5786749514 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.3306727326 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5648258387 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.262512317 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4036795798 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.2593989014 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.4825732152 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2177203514 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.452576603 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.2013677498 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4740327886 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.2015887265 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4935901226 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3098535214 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5740290935 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.0913702814 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3128837987 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2155836452 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.4583181839 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.2468017951 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4734415865 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2276258723 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.4577745447 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.3046437152 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3825631739 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.1034813211 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2900727397 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0357350273 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.2486408005 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3838720489 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.5776118345 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.200683389 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.4892134584 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.2846718719 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5239506053 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.135802286 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.3994207414 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.1470288737 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.370597998 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.0624257747 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.3667603362 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.271926141 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5318057054 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2579782083 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4806502272 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2987546297 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.526361525 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.1515083487 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4332812085 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3458633411 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5703964991 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.4050410338 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6535211779 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2598947984 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4881220333 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.2015903544 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.4513077936 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.260901002 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.4896606547 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.1429173328 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4071639857 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2472539314 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.4972878378 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.2865823477 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.5850706516 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.0888165228 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.2927704081 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0527161443 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.3183888298 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.024472012 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2143061298 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0100859589 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.2528047704 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.285587224 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5216659729 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.1281773816 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.3720376754 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4479091606 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6272058507 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.4155919737 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5685427433 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2568309796 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5058927884 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3323405641 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5569354008 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3183331223 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5559144449 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4500659682 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6761551234 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.2803966495 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5308215606 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.5346576918 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.7024180686 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2051262499 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.4837372958 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3699194641 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.5770913921 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1806014296 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.4291519278 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.0966721561 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.3133383199 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.2666171334 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.4765001737 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.1168753501 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.3522716786 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.2270309753 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.4841536531 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.1352090178 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.3326584955 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.067782587 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.2594122638 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.0496762437 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.2555516699 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.1103212906 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.3317936338 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1178727843 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.3706477532 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2704960778 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5452851397 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.395555296 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.5799018584 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.253350788 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.458172945 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.1663559354 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.4946292339 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.3079953173 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5447429639 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.3935950974 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6342780862 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.2983575506 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5283269577 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.3087303367 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.6028401745 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2210855899 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4616487061 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2867265678 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5646798034 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.357367421 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5659157865 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.3515649071 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5645706042 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.1896909211 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4144350541 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.202234159 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4284203038 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2422208114 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.4745802383 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.3118363896 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.4892437324 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0689409767 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.2722531305 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0406781073 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0970886698 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2772171859 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5118206984 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3271066365 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5803660329 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2451818788 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.4929183421 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.2948409512 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5143250682 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0677223644 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1661136189 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0419433658 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1567633534 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2584265792 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5020697076 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2624388601 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4452300688 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2640324297 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.5196545965 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2748329219 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.5341998684 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2872551102 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5360250569 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3575088107 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.5879974234 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0892196115 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.266303191 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0392376693 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.1442620012 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2174626032 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.4686565248 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0941401506 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1690248565 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.0921572696 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.3072945662 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.052810575 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.2387421258 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0706373037 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2741240176 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0463945559 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.1664955069 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2098595469 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4603190119 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.0831701767 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2065328404 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2619931658 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5251502482 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2725475868 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3148065512 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1611133093 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.379825756 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.0702261565 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.3706020457 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.1723520986 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4083355109 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1631097827 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3376536763 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.0539023061 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.1825644081 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0390551527 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.1712135521 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.0584274365 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.2032749366 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.0680986525 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.1147231502 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.3942588381 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.1208986545 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.329533412 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2166642565 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.4531623464 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.2433592841 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.3890038008 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.0907074882 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.3354239861 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.0993142086 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3089493054 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1494352369 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.3928912763 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.212669524 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4040671507 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.1385938854 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.3301851724 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0056778273 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.2000094468 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.1920493262 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.3987398592 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1143530268 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.3000528345 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.090597898 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.3141862136 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.0583354997 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.2066334095 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.0984443913 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.385398237 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.0906994852 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.3103360752 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.1762047672 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4472079773 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1314817408 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.3114200678 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.1749870589 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.3959743603 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.1992458221 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.3995820747 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.1578229782 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.3697628875 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.0776521407 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.2805707324 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.0726133349 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.2357676924 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0025842148 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.2080643735 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.2220546496 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.4769435204 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.2026562463 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.3851807662 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.2301502689 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.4644650793 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.2921772734 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.4951314188 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.2059164492 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.4480550849 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.0964637139 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.2014449762 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.4124666467 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.582315662 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.5519762012 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7446058172 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.2337331881 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.4523774022 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.2045157252 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.4389018917 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.1671223511 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.4271635079 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.0972518606 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.3009816209 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.2033697572 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.4085758597 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.1337024916 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.3569658269 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.2381890937 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.4806457757 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.3213357404 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.5096591733 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0354285129 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1982926593 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0009992134 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.0462874193 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.168790959 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.3588726594 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.0998466384 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.3089879911 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.0730728705 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.2880810134 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.032930228 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.1836595807 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.2951777856 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.5193991656 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.332068694 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.5232846835 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.0924512162 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.2983835975 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.081522251 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3091578658 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.1578469391 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.3871847635 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.0748322147 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.2638608298 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.1717243204 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.4178336488 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.1865357446 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.429444403 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.0478268633 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.2570257732 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.0018410191 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.1558631502 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.0364948502 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.2541169376 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.0232335134 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.2533249921 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.1826323546 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.4460216478 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.1650968642 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.3244010767 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.1933631076 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.4686346426 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.1629637627 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.265082494 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.0726508623 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.3051851212 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.1282743245 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.3321469572 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.1233188769 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.3275167565 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.0449879835 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.2826754009 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.1013719184 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.2292361214 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.0071013458 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.1783377636 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.1401399582 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.3051974688 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.0942053588 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.3363687748 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.1324044329 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.3790251178 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.1547958954 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.2281907624 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.04633447 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2489624204 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0124095873 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.0933720751 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.2273546789 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.4493238694 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.1724674084 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.3974478706 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.1570380948 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.4536227649 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.0768901169 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.2918693283 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.0180474118 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.2099411444 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.0414049927 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.2278780188 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.171951865 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.3835379408 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.1659756056 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4178488097 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.144541816 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.3648764501 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.1047482644 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.2965277611 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.2497767256 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.4824221555 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.1854347311 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.331339842 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.0578909241 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.2614924673 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1528509146 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.347684852 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.1703660079 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.4009054828 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.0612834989 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.3159716539 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.1766082572 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.4438802086 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.2113751191 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.3971789312 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.0288119948 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.1974757162 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0004462318 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.1835550789 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0322766368 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.1548467965 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0104672499 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.1495897529 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.1266427785 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.3740164648 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.0281188176 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.1879339756 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.3595710948 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.539538196 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.3110476538 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.4964416902 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.1791082561 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.4315704667 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.1725231395 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.3476924531 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.2073899393 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.4691838054 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.1956364634 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.3100521945 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.2131558334 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.4133959067 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.1729368847 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.3072044813 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.1671614266 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.4422244829 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.1893614933 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.4605763082 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.0204702219 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.2077171561 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.0015730125 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.1513689177 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.1191725522 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.3048062246 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.0235301378 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.1674956015 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.079322028 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.330454367 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.0184455254 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.1256002879 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.038846423 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.2024296237 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.0139189497 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.1438358845 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.027300431 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.1864710841 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.0183915432 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.1602963374 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.139057659 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.366792492 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.237878029 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.4452128635 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.1119370423 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.3476430008 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.016563929 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.225837323 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.2563194972 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.498105827 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.2800341704 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.4239442229 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.153544279 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.381670314 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.0470329064 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.3516233998 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.116565827 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.3259696821 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.1799251119 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.4422961909 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.2177874056 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.4228885108 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.2215396728 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.4514044695 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.0505657194 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.297617816 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.0562697145 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.2287718392 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.1077250531 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.3466580166 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.2151882368 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.3617567446 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0275426369 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.1625316134 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0540664405 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.1246699911 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.3740469363 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.1584629952 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.3608300472 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.1934348695 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.4161013327 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.2103705273 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.4294671925 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0244434593 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1675541923 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0007178002 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1007849921 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.142024307 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.3925303581 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.13811776 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.3521086255 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.1642228534 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.3736012886 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.055748564 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.2468016347 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.1850447544 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.4328029287 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.2262846976 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.3523271738 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0509608434 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.225219126 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0166144137 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.160771848 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.1255642972 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.3734878168 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0067248884 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.0887426693 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.0447439631 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.2216512685 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0026591548 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.1403714517 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0254727037 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2062253383 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0094132633 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.0989408911 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1143976046 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.3625809543 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1277032117 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2179430009 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2115579648 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.4634573062 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.1903215556 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.2429625775 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.0151163425 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.1971831566 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.023417855 + }, + { + "model":"meta-llama\/llama-3.1-8b-instruct", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.1827820551 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.0534412445 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.1423750168 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.0522677244 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.1317238701 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.0061046998 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.048395385 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.1624192131 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.0365328036 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.1594198405 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.089863703 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.2290725718 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.1186358374 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.2861009841 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.0659782167 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.1219080159 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.0197183104 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.1858500787 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.1372446539 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.1970334371 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.0225723033 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.2128372612 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.0900337367 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.2030113676 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.1275394125 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.2249822055 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.1164104087 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.2255759794 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.0396919548 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.193498077 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.0463130015 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.147263979 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.0196332917 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.0615297483 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.002077843 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.0228028425 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.0192847454 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.1432000045 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.0179600462 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.1308378956 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.0103335448 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.0394434629 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.0093410183 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.0758287765 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.2072883352 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.2238489904 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.2192906863 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.330676254 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.0506856305 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.2502940387 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.0801303171 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.1635269784 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.050859162 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.2002283949 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.0199756762 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.1055944134 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.001996605 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.1999016804 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.0453589274 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.1405820992 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.1115247653 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.1296059134 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.1480453761 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.2690624141 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.0114376329 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.0233475148 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.0385720696 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.1423687352 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.0697220351 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.1874677848 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.135086862 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.2446182636 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.0190942897 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.1108498114 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.2-1b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.0294450289 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2279903683 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4722573355 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1435174722 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3991235315 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.1058038471 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.3048469769 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0491812173 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.2808449794 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.1452228976 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.3699202818 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0630164833 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.1755172285 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.2933386948 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.5447211689 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.2166524228 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.4496497227 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2997360932 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.552448295 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.2837522278 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5150814494 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1559168311 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4268663808 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1391913129 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3773300026 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1936957127 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4274660929 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2338775014 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4546098648 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2240336457 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.456891102 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0249457171 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.237299794 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3606359676 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5477908661 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1847580734 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.3911269476 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.1576463626 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.3910005157 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1690495289 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.3930640761 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.1487255467 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4407404732 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2175383868 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4344749015 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.3061950313 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.5535821276 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1811004213 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.3534531968 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2646772038 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5157826791 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.331255344 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5093924414 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.3806413844 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.5722776653 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.2863154138 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.5492472281 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.181535472 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4498383877 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0712120544 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.3404533027 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.2928040954 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.5416342014 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.3623393932 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5863625454 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3129672706 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5456543979 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.4852409005 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6908376394 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.2581336709 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.4704308834 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3342775397 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5026657233 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5510215557 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.6909834226 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.6679215449 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.823262947 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3139331841 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5454623234 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3561290923 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.599796306 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.3069040556 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5327832177 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.2185015953 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.4264089038 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3745780882 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5785175063 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.2904415478 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.5908280404 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.2963449909 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5544997379 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5091700689 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.690320784 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0862885919 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2372420697 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0261732885 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.168027641 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.295613677 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5221513183 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1697878702 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4619303787 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1704488365 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4403441536 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.1466885285 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4179596519 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.385731086 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6034244629 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.357812342 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.5894721809 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2543010782 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.4974062413 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1038893205 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3250555425 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.276319154 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5531277158 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3130631115 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.576837791 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3143630083 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5621460006 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3372718385 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6543894215 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.1641186812 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.4109013799 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1375093856 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.3810358014 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.2236376263 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4348813399 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.1135128656 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4345857133 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.2934122255 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5393871714 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3100077394 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5714730187 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.284322765 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5304019177 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.2212745751 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.355950114 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.2779520489 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5022141687 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2476437073 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.4805413308 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.1839138217 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4860524069 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.170404008 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4549282359 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.2759135194 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5427685716 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.1237988917 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3265823778 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2379701997 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.4807978998 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.2068140088 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4615143451 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2508944927 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.4998320266 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.210142355 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3127505848 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0890010757 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2623679578 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0406768013 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.2265562343 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3934799806 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.6000359011 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2497480714 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.5149579975 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.2776870629 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5361437897 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.101231398 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.3867790942 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.1710070826 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.3961869922 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.0586978059 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.3322172345 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.2566290969 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5196341734 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2701878605 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4964908212 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.3224419544 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.5606155155 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.1663847917 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4383662593 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3103894957 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5854645421 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.3913336262 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6467989318 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2392486974 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4920626101 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.2130836675 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.4622075168 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.2893481535 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5215715176 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.1419402772 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4014256358 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.249611031 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.4991029967 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.2942599953 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.5860228525 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.0973366086 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.3232614896 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0552969578 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.3314346183 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0356994946 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2438060785 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0183592041 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.3076327609 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.2403245803 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5023246313 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.1415388613 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.4055113288 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4519562833 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6328740374 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.3918546765 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.551810658 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2474554181 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.490135462 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3387973296 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5550868321 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3065957195 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5567333989 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4450524918 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6712742861 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.2717880574 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5367497902 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.4990357373 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6703309998 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2184907643 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.4824691404 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3406091079 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.5689518318 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1780482269 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.4251975218 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.1238628432 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.3651594596 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.2363136631 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.4724628618 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.1012580658 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.3226539734 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.1702954814 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.4314499751 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.1165218233 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.3219658957 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0415760658 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.2726763268 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.059393934 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.3265574234 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.0974935448 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.337395124 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.0786475166 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.3616383914 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2468393111 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.497224405 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4165200238 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.60128551 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.2331294709 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.4605502791 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.1664653883 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.4762879225 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.3181506443 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5441377883 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.384958542 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6364660715 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.2373393477 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5017230165 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.2334583695 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.5603415221 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2147204762 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4649686586 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2451735521 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5352886898 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3767393472 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5870286691 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.3415510311 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5592933672 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.1801710665 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4238537274 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.1125461134 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.3456654305 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2385233061 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.4987667959 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.3202315883 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.4748886274 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0653357736 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.3152990905 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0468367135 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.1314286197 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2786347493 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5143010521 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3361615644 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5732166456 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2384384134 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.4989290832 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.4068700974 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5784786574 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0295327628 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.168725075 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.047075079 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.2446929278 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.252958993 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5053979802 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2339821201 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.425306622 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.236632122 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.4793696196 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.265421135 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.5116987882 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2721498467 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5200799335 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3613736416 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.5866656133 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0887261142 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2752257416 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0469317169 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.2008453897 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.1844305556 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.4417239043 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1248600823 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1650750126 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.0773908628 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.2972337309 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0211167911 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.2699477659 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0578164805 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2633608218 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0591720568 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.1753356197 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2018552397 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4546838419 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1477972133 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.238559837 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2259180607 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5258178103 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2474954475 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.2841722148 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1511814979 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.3667501588 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.0635700737 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.3690469819 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.3304277157 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.5443905094 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1851657228 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4035662808 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.109249521 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.3018012797 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0601412463 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.3378209538 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.278050095 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.5030892659 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.2056413876 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.319475702 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.3412628716 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.6168944847 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.2079777284 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.4737326062 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.3288891576 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.560493221 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.3370289388 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5616376735 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1877842343 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4430965745 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1822974398 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3877585115 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.2820784803 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.5005600008 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.1762767818 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.3980584269 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2678950965 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.5139106802 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.1062771627 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.3373123707 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3378377362 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5424277928 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2039436913 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.413295677 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.2078798411 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4443945632 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1864199422 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.4220840798 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.1482839317 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4568926673 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2815774482 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4716025494 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2239129937 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4981762083 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1952639614 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.40510597 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.3130233588 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5569163893 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3322667951 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5140240989 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.3401088117 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.5684561927 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.4507021781 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.6542740054 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.2563123252 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.517826657 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.2261228199 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.4918700987 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.3778406936 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.6293186521 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.4207498261 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.6224036774 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.386239845 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.6110300223 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.4508475568 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6653203029 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3208174129 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5441131834 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3167289307 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5086510118 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.5649266234 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.7240609445 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.6160790992 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.8133281991 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3152773331 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5548531112 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3335962816 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.5859881472 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2974755741 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.548510072 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.198877694 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.4016676481 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3394346908 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5772205685 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.2961737536 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.5732830973 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3174175523 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5682518332 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5173973527 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7056428374 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0282301718 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2509358266 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0302470726 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.2143808411 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.336179684 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5448761462 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1255076156 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4301109075 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.2176466652 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4472887488 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.2048605344 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4547067722 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3796955055 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6056742688 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.382370623 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.5922578575 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2583771315 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.4968818998 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.116404849 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.355624191 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2893259192 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5696888872 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3664678104 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.6152145331 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.2523550022 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5458277736 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3774331947 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6486159416 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.2004372781 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.4254008414 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.2594342647 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.4939201844 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.1883645682 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4379611856 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.166061461 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4725232576 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.2923994901 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5447705341 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.4037821428 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.6296260979 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.3130983776 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5536124921 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.3266051607 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4444671407 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3146151088 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5434123174 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.3068652176 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5696595268 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.2107380254 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4991705013 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.331371608 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.5825812793 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3610313078 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.605032383 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.1827077293 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.4206815495 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.273765965 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.5541955864 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.2689874625 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.5150630417 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2599758467 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.4915631618 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.1778560135 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.2969773205 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0622795727 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.2675764955 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0381251381 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.2812186233 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.2963258613 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.5478698134 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2490501232 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.470734921 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.2517024761 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5071223357 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.1690507631 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.4610312304 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.245769233 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.4441647844 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.1869691691 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.4993277276 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.3697837131 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.598263628 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2866761532 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.5500074549 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.3125095049 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.5535296132 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2275791183 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4569915545 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.345465339 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5897544047 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.4313143535 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.672362003 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.3075903861 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.578349632 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1897910105 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.4717519215 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.3557303786 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5879008408 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.1851047496 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4783025401 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2465270522 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5037852263 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.3149743955 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.5635296931 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.1800815958 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.4077560746 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0667158921 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.3678415876 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0536067183 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2934406231 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0212136796 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.3367052821 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.2884546263 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5474826718 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.2053276951 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.4215800492 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4246522462 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6364852561 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.439726575 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5806732389 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2708043929 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5320865131 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.2827359953 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5407300006 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3451568022 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5845365036 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4582156105 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6491023878 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.3130092522 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5728467895 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.503492173 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6731092747 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2567420946 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5061211552 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.4025875747 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.6083538055 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1596218382 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.3642420922 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.1505395069 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.4131000516 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.3060556532 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.5236224481 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.2303677631 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.4550652237 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.2505378464 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.4777570712 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.238193304 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.4255249112 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.1176743345 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3404474685 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.1289978109 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.426186094 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.2374825749 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.4257984603 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1278040594 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.4360467159 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2878836927 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5437304451 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4038152012 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.5978824564 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.2373274152 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.4608187705 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.1899355362 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.4693159323 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.298223826 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5684457257 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.3825937295 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6393626909 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.3425500041 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5680420054 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.2980763573 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.5924685945 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2473591284 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.5382867852 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.3068229029 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5637367471 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3462186566 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.6055817314 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.3822149946 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5783618359 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.2141866571 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4746491206 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.2383903304 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4750617701 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2652851581 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5278626321 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.3718263092 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.5255136074 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.1999962108 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.4183108341 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.1133461632 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.2113810541 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2978237586 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5152360665 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3447394658 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5850690403 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2589937034 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5348601679 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3544986277 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5913345073 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0650028377 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1912574022 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0525305732 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.2699878572 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.253549974 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5235064606 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2484556869 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.429442787 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2701010494 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.5241051692 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.3181656056 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.5907906511 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2670924013 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5198891912 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3597766713 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6081806669 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0741464388 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2660826012 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0695734356 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.2997632689 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2653942694 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.4893923691 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1157826458 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1765005496 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.1376742076 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.3734228567 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0864151864 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.4104899998 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0937886749 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.3196766983 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.1093519063 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.3224056963 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2204568545 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4894165826 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1569463992 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.232785021 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2703289724 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5473102513 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.317769874 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3676906362 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.2474518428 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.5019415605 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.19092807 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.4983188666 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.1327783313 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.3636961218 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1557273583 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3515058711 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.0375398146 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.1986406573 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0015655622 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.0623964125 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.0476085337 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.205897506 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0110136998 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.0688367427 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.0927070911 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.3300356171 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.1909661669 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.4391780261 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.1548779531 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.3887963415 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.268706305 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.4959259833 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.0374286633 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.276784029 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1363017113 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3536429421 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.106947781 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.3169488071 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.1479958867 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.3761797641 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.0312538317 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.2922637643 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0234894436 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.2225963414 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.2171579973 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.456713607 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1681044686 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.3440820027 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.0298418752 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.2580610439 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.041095966 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.2930729253 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.0556571943 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.3548784075 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.066482798 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.3295363828 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.1569501012 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4039420627 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1151073387 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.3126448605 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.4660772497 + "score":0.095240952 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.3840548344 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.1876367188 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.4310988737 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.1916153649 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.4266920518 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.0532026402 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.2442653709 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.0233838479 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.2071232952 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0030055044 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.1680771697 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.1169562212 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.4547809891 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.2167266047 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.4629060689 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.2546126219 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.4840060449 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.3171866034 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.5752285995 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.1236158233 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.3922493462 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.1783375751 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.4003787241 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.3642023499 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.5697992815 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.4959810553 + }, + { + "model":"microsoft\/phi-4", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.7280386297 + "score":0.7232313255 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"es", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3593767686 + "score":0.1732534835 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5668073679 + "score":0.4434970776 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3662275621 + "score":0.3605235101 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6102640711 + "score":0.5849733787 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.286051969 + "score":0.0868573088 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5373856549 + "score":0.3068232268 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.1816947237 + "score":0.0883262705 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.3981159206 + "score":0.3294670602 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.3579818144 + "score":0.1921595243 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.5889481625 + "score":0.4381909531 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.3403832088 + "score":0.2102834142 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.590264879 + "score":0.503934087 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3180384008 + "score":0.1763652726 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5571267732 + "score":0.4428784232 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.5778354146 + "score":0.3772793055 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.7490356238 + "score":0.5820724576 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0067893116 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2007893146 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0132875082 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1300679396 + }, + { + "model":"microsoft\/phi-4", "bcp_47":"gu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.34811918 + "score":0.1581139234 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5482709715 + "score":0.3992847318 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.1618983325 + "score":0.1006122628 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4411905252 + "score":0.3529986856 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1925315551 + "score":0.0310807341 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.4032389241 + "score":0.2470826922 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.1992720083 + "score":0.0634023566 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.4905441802 + "score":0.2955476351 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3722751955 + "score":0.2788689746 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6207213131 + "score":0.5417455941 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3378499277 + "score":0.2369610218 }, { - "model":"google\/gemini-flash-1.5", + "model":"microsoft\/phi-4", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.554090013 + "score":0.3765795877 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", + "model":"microsoft\/phi-4", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.1094117889 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.3715115564 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.0627224628 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3120135336 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ht", + "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.3583744222 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.5732194975 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.3364664006 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.6438910651 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"hu", "task":"mgsm", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.3074361781 + "score":0.1148528139 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5178180754 + "score":0.3969632133 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.3505959215 + "score":0.2004789157 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.5955060476 + "score":0.4541545495 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"id", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.2581140706 + "score":0.0855471394 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5395853617 + "score":0.3720740561 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.3298839393 + "score":0.284365864 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.4471547552 + "score":0.589202199 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.3177915441 + "score":0.0344910359 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.5387853038 + "score":0.2176253825 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.2549228547 + "score":0.0020930717 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.5322440265 + "score":0.0498013123 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.2858443353 + "score":0.0788515324 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.5499221943 + "score":0.3023201397 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.2481102245 + "score":0.0177354807 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.4829685786 + "score":0.2429763441 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"it", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.2305492704 + "score":0.1849581121 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.4826740501 + "score":0.4562979327 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.1746024172 + "score":0.2591551222 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.3073554703 + "score":0.5311194854 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ml", + "model":"microsoft\/phi-4", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3161992509 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5479755911 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2133071404 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4660281027 + "model":"microsoft\/phi-4", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"classification", + "model":"microsoft\/phi-4", + "bcp_47":"ja", + "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2370074805 + "score":0.1462066826 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.4804215458 + "score":0.4299215293 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.2399769139 + "score":0.2371087689 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.4726429935 + "score":0.4064089202 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.3104483533 + "score":0.1102793601 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5705763492 + "score":0.3718502317 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.4229626959 + "score":0.0999035402 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.6856510383 + "score":0.3664761129 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.2227645269 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.4888582617 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.1869632744 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.4322398057 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"om", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.0258426139 + "score":0.0537848954 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.2237241232 + "score":0.3139411656 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.0460531144 + "score":0.0666822222 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.3418147419 + "score":0.3622322436 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"km", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.3714452662 + "score":0.0753739979 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.5977153904 + "score":0.3445771251 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.2234825764 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.4562477173 + "score":0.1701733674 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.4180718844 + "score":0.104202131 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.6426219278 + "score":0.3590734072 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.3938693136 + "score":0.0705324379 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.5573992167 + "score":0.3025321109 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2456102401 + "score":0.1107444823 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.5190609119 + "score":0.3916459404 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.4265619216 + "score":0.1649626358 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.6320824157 + "score":0.2656552119 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.3537745123 + "score":0.0539171508 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.5904429929 + "score":0.2436825008 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.4588664196 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.6844540285 + "score":0.1581276083 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", + "model":"microsoft\/phi-4", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", + "model":"microsoft\/phi-4", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.2449777422 + "score":0.1658903033 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", + "model":"microsoft\/phi-4", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.5268764903 + "score":0.4217933103 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", + "model":"microsoft\/phi-4", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.3789708434 + "score":0.0803859812 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", + "model":"microsoft\/phi-4", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.5790333031 + "score":0.3220461814 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sd", + "model":"microsoft\/phi-4", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sd", + "model":"microsoft\/phi-4", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.3352727297 + "score":0.1018185799 }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sd", + { + "model":"microsoft\/phi-4", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.5583215205 + "score":0.3881585962 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sd", + "model":"microsoft\/phi-4", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.2009000601 + "score":0.0840554004 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sd", + "model":"microsoft\/phi-4", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4004383195 + "score":0.3260852936 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", + "model":"microsoft\/phi-4", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", + "model":"microsoft\/phi-4", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.2 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", + "model":"microsoft\/phi-4", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.3005035588 + "score":0.036255172 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", + "model":"microsoft\/phi-4", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5210660172 + "score":0.2361171448 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", + "model":"microsoft\/phi-4", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.3401968092 + "score":0.0369324798 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", + "model":"microsoft\/phi-4", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.6217197146 + "score":0.3426601677 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ta", + "model":"microsoft\/phi-4", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ta", + "model":"microsoft\/phi-4", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2662307086 + "score":0.1675392326 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ta", + "model":"microsoft\/phi-4", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5053585639 + "score":0.4161590898 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ta", + "model":"microsoft\/phi-4", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.3044345778 + "score":0.101823454 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ta", + "model":"microsoft\/phi-4", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.5714036731 + "score":0.3124446375 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", + "model":"microsoft\/phi-4", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", + "model":"microsoft\/phi-4", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.3330093484 + "score":0.1012625471 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", + "model":"microsoft\/phi-4", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5694168709 + "score":0.3580813711 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", + "model":"microsoft\/phi-4", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.257812168 + "score":0.0891010327 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", + "model":"microsoft\/phi-4", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.5167002436 + "score":0.3158325956 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"th", + "model":"microsoft\/phi-4", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"th", - "task":"mgsm", + "model":"microsoft\/phi-4", + "bcp_47":"ms", + "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"th", + "model":"microsoft\/phi-4", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.2992360169 + "score":0.1211248924 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"th", + "model":"microsoft\/phi-4", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.5585599708 + "score":0.389246098 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"th", + "model":"microsoft\/phi-4", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.4269079012 + "score":0.2367123999 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"th", + "model":"microsoft\/phi-4", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.5719718715 + "score":0.5273473365 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"tr", + "model":"microsoft\/phi-4", + "bcp_47":"my", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"tr", + "model":"microsoft\/phi-4", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.2832304201 + "score":0.1262296798 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"tr", + "model":"microsoft\/phi-4", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.5467240003 + "score":0.3480250641 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"tr", + "model":"microsoft\/phi-4", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.3273464288 + "score":0.104091386 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"tr", + "model":"microsoft\/phi-4", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.5827048506 + "score":0.3135377948 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.322448107 + "score":0.1488007297 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5887654616 + "score":0.4132412315 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2148139783 + "score":0.0478735067 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.4226865444 + "score":0.3069618299 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"uz", + "model":"microsoft\/phi-4", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"uz", + "model":"microsoft\/phi-4", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2829644119 + "score":0.1523025562 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"uz", + "model":"microsoft\/phi-4", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5194956482 + "score":0.4096891017 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"uz", + "model":"microsoft\/phi-4", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.2911955464 + "score":0.2469695748 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"uz", + "model":"microsoft\/phi-4", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.5560139888 + "score":0.524876157 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", + "model":"microsoft\/phi-4", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", + "model":"microsoft\/phi-4", + "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", + "model":"microsoft\/phi-4", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2745000434 + "score":0.0369494139 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", + "model":"microsoft\/phi-4", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.5206422805 + "score":0.2350129808 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", + "model":"microsoft\/phi-4", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.4261790941 + "score":0.0015518794 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", + "model":"microsoft\/phi-4", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.6358462464 + "score":0.1140211549 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"wuu", + "model":"microsoft\/phi-4", + "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"wuu", + "model":"microsoft\/phi-4", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.2072386748 + "score":0.0103766134 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"wuu", + "model":"microsoft\/phi-4", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.4628288648 + "score":0.1821363344 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"wuu", + "model":"microsoft\/phi-4", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.1471425714 + "score":0.0003856632 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"wuu", + "model":"microsoft\/phi-4", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.1971299212 + "score":0.0985339751 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"yue", + "model":"microsoft\/phi-4", + "bcp_47":"or", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"yue", + "model":"microsoft\/phi-4", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.2253512269 + "score":0.1279029727 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"yue", + "model":"microsoft\/phi-4", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.4949150094 + "score":0.3504496172 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"yue", + "model":"microsoft\/phi-4", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.1897306863 + "score":0.1158076498 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"yue", + "model":"microsoft\/phi-4", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.2561574259 + "score":0.3583374616 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", + "model":"microsoft\/phi-4", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", + "model":"microsoft\/phi-4", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2201641871 + "score":0.3550414512 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", + "model":"microsoft\/phi-4", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.5051068628 + "score":0.5626107823 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", + "model":"microsoft\/phi-4", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.2508351517 + "score":0.2784963846 }, { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", + "model":"microsoft\/phi-4", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.3110461024 + "score":0.4121299981 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"microsoft\/phi-4", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"microsoft\/phi-4", + "bcp_47":"pl", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"microsoft\/phi-4", + "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"microsoft\/phi-4", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.1906134629 + "score":0.1049411882 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"microsoft\/phi-4", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.4467868389 + "score":0.371724232 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"microsoft\/phi-4", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.2001643223 + "score":0.2126550777 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"microsoft\/phi-4", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.3225170104 + "score":0.4754992095 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"microsoft\/phi-4", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"microsoft\/phi-4", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.1876459632 + "score":0.1813353123 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"microsoft\/phi-4", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4830875841 + "score":0.4632560004 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"microsoft\/phi-4", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.1830944017 + "score":0.3450201321 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"microsoft\/phi-4", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.4175337587 + "score":0.5827805827 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"microsoft\/phi-4", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"microsoft\/phi-4", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"microsoft\/phi-4", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.260683336 + "score":0.1323104842 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"microsoft\/phi-4", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5383651277 + "score":0.3747307468 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"microsoft\/phi-4", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.2962406565 + "score":0.2733723845 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"microsoft\/phi-4", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.5190026627 + "score":0.5057937589 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"microsoft\/phi-4", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"microsoft\/phi-4", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.1675595946 + "score":0.164734586 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"microsoft\/phi-4", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.4187188467 + "score":0.4400610126 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"microsoft\/phi-4", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1545869288 + "score":0.2884407046 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"microsoft\/phi-4", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.4031218248 + "score":0.5338739518 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"microsoft\/phi-4", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"microsoft\/phi-4", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.1604267099 + "score":0.0202859007 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"microsoft\/phi-4", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.4139767864 + "score":0.2084128437 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"microsoft\/phi-4", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.1651025864 + "score":0.0129709626 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"microsoft\/phi-4", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.3978212407 + "score":0.1407028363 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"microsoft\/phi-4", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"microsoft\/phi-4", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.2519150677 + "score":0.0476641683 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"microsoft\/phi-4", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.4966963131 + "score":0.1691869095 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"microsoft\/phi-4", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.2057435019 + "score":0.0111247819 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"microsoft\/phi-4", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.4016427491 + "score":0.151377306 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.2183929994 + "score":0.0307653909 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.4877941086 + "score":0.2382457281 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.2700916391 + "score":0.0240096696 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.5150577414 + "score":0.154444722 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"microsoft\/phi-4", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"microsoft\/phi-4", + "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"microsoft\/phi-4", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"microsoft\/phi-4", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.3440655166 + "score":0.0116292791 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"microsoft\/phi-4", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.563902418 + "score":0.1897831748 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"microsoft\/phi-4", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.4305522274 + "score":0.000876482 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"microsoft\/phi-4", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.6477508732 + "score":0.066397943 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.4113463435 + "score":0.0221364496 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.6260248317 + "score":0.2036637198 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.5310035709 + "score":0.0300378344 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.7595845064 + "score":0.146034089 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"microsoft\/phi-4", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"microsoft\/phi-4", + "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"microsoft\/phi-4", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.3031284355 + "score":0.1551096033 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"microsoft\/phi-4", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.5241309352 + "score":0.4297549368 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"microsoft\/phi-4", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.3289699508 + "score":0.200397515 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"microsoft\/phi-4", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.5811203167 + "score":0.4351193348 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"microsoft\/phi-4", + "bcp_47":"su", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"microsoft\/phi-4", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2483616515 + "score":0.0631852964 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"microsoft\/phi-4", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.5338391625 + "score":0.3127999721 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"microsoft\/phi-4", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.1651229998 + "score":0.0328870671 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"microsoft\/phi-4", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.3923963113 + "score":0.285042966 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"microsoft\/phi-4", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"microsoft\/phi-4", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"microsoft\/phi-4", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3057177881 + "score":0.1749499193 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"microsoft\/phi-4", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5523945263 + "score":0.4691275614 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"microsoft\/phi-4", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.2711892461 + "score":0.2454574882 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"microsoft\/phi-4", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.5802332073 + "score":0.5348019826 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.3349110908 + "score":0.1325294802 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.564806297 + "score":0.4051925402 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.4574014191 + "score":0.1631216823 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.6626552528 + "score":0.4696161488 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"microsoft\/phi-4", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"microsoft\/phi-4", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2954497906 + "score":0.1338729952 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"microsoft\/phi-4", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5086877895 + "score":0.3640492116 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"microsoft\/phi-4", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.1582270271 + "score":0.1115670494 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"microsoft\/phi-4", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.4201411039 + "score":0.4303510763 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.1697291765 + "score":0.2374723306 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.4073157654 + "score":0.4675485501 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.139672818 + "score":0.2528444882 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.4450194819 + "score":0.4794045124 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"microsoft\/phi-4", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"microsoft\/phi-4", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.3184042229 + "score":0.00699528 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"microsoft\/phi-4", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.5712698408 + "score":0.2382738034 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"microsoft\/phi-4", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.3659029431 + "score":0.0018437478 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"microsoft\/phi-4", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.5796195236 + "score":0.2225002567 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", + "model":"microsoft\/phi-4", + "bcp_47":"th", + "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.2301748885 + "score":0.1140490825 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.4682741896 + "score":0.3668015685 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.3346592082 + "score":0.1317498141 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"microsoft\/phi-4", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.6514874668 + "score":0.2770372268 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.2724260509 + "score":0.0342955291 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.5200202435 + "score":0.2066101372 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.2753225284 + "score":0.0101983319 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"it", + "model":"microsoft\/phi-4", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.5457466615 + "score":0.0539238863 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.2664966821 + "score":0.1209396556 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5386982677 + "score":0.3409074931 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.2651365589 + "score":0.270580586 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", + "model":"microsoft\/phi-4", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.409095006 + "score":0.537606561 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.2326358655 + "score":0.1285741979 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.4815897231 + "score":0.4057727321 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.2187928356 + "score":0.1865914948 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", + "model":"microsoft\/phi-4", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.4896578943 + "score":0.4565231191 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.247746183 + "score":0.0177160721 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.506339637 + "score":0.1342994379 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.1775009719 + "score":0.0010895392 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"microsoft\/phi-4", + "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.4300321597 + "score":0.0283042279 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.2402657185 + "score":0.1155003818 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.497198112 + "score":0.3250077925 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.3100527074 + "score":0.1195513435 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"microsoft\/phi-4", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.3696197774 + "score":0.3158904676 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"microsoft\/phi-4", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"microsoft\/phi-4", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2600500491 + "score":0.0676473408 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"microsoft\/phi-4", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.5029669853 + "score":0.2672641675 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"microsoft\/phi-4", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.2091322046 + "score":0.0166808106 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"microsoft\/phi-4", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.4711774201 + "score":0.2361978954 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2256246926 + "score":0.1452425625 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4703189943 + "score":0.3941195385 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.2254492518 + "score":0.2680553268 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"microsoft\/phi-4", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.447826525 + "score":0.5055559664 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.3 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.2986303081 + "score":0.0218129891 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.5546917725 + "score":0.2316696377 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.3680194341 + "score":0.0005135911 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"microsoft\/phi-4", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.6778287705 + "score":0.0644762753 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.1979480779 + "score":0.0721904827 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.4791457508 + "score":0.3322122834 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1536786708 + "score":0.0963078281 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"my", + "model":"microsoft\/phi-4", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.4315811907 + "score":0.1506583582 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"xh", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"xh", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.0981161875 + "score":0.0658670408 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.3370208163 + "score":0.2264957148 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.040931235 + "score":0.0240888197 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"om", + "model":"microsoft\/phi-4", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.3615428475 + "score":0.1589846026 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.2626677598 + "score":0.0361610953 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.4970567085 + "score":0.2209617429 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.1807466012 + "score":0.0152526027 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"or", + "model":"microsoft\/phi-4", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.4219189716 + "score":0.1066841292 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.3706063992 + "score":0.1360263411 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.6167676482 + "score":0.4135302369 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.4234596823 + "score":0.1427052583 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.5629443923 + "score":0.2190638456 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.2754265608 + "score":0.1516445239 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5207065369 + "score":0.4517979691 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.3700040895 + "score":0.2058198052 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pl", + "model":"microsoft\/phi-4", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.5924241261 + "score":0.2799124898 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.2971403532 + "score":0.0158837296 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.5321068893 + "score":0.2111229219 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.4364286549 + "score":0.0440027048 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.6509885745 + "score":0.1856579938 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.1381244544 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.3106084366 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1319133586 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.2261398681 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"af", + "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.2300270544 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.4839384065 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.4236492288 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.6116207052 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.2571204202 + "score":0.0101349522 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.4946608155 + "score":0.0727946226 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.0869374651 + "score":0.0087636854 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.3119061498 + "score":0.0326918009 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.2501435914 + "score":0.0143438883 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.5088299265 + "score":0.0651139855 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.262372343 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.5806899403 + "score":0.0145699741 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.2450100573 + "score":0.1077126314 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.4918691312 + "score":0.3303312588 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.2434733519 + "score":0.0568249639 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.5120095348 + "score":0.1985159581 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.2 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.3568851036 + "score":0.1428907436 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5825326367 + "score":0.3107041775 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3112091725 + "score":0.1849770017 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.5431414206 + "score":0.2932088535 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.2544201673 + "score":0.0246413933 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.5081271409 + "score":0.2220905764 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.2942923294 + "score":0.0462912201 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.4479604827 + "score":0.2082310898 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.2563119866 + "score":0.021812522 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.5291012922 + "score":0.1700035697 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.3009595898 + "score":0.0687018163 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.5854044281 + "score":0.213092048 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"as", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.2402951661 + "score":0.0516867052 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.5033005385 + "score":0.2165108464 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.2302239803 + "score":0.0097728449 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.4066956434 + "score":0.1483692036 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.203750264 + "score":0.08262787 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.4979829233 + "score":0.281005553 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.2162945849 + "score":0.0481979333 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.4941278712 + "score":0.2232523474 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"az", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.2537752957 + "score":0.0805820584 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.5073147534 + "score":0.2555758551 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.3583753747 + "score":0.0296286693 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.6253917282 + "score":0.1319853113 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"be", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.1700904158 + "score":0.0173366455 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.421111634 + "score":0.220616462 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.1213993524 + "score":0.0065148659 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.1655788185 + "score":0.1526491803 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.1783312983 + "score":0.0459721625 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.4423885999 + "score":0.2229551601 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.1632112014 + "score":0.0233985631 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.2297357227 + "score":0.1665184954 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.249810194 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.5151255506 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.1854861198 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.2463326959 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.1 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"mmlu", "metric":"accuracy", "score":0.3 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.1913062339 + "score":0.0355167863 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.4296053228 + "score":0.2600874171 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.13443556 + "score":0.0323184525 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.2528930204 + "score":0.1970289791 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.24265587 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.4918380331 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.2104382871 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.456050442 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.2891206499 + "score":0.0892751266 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.5438550217 + "score":0.2388608153 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.3184721364 + "score":0.0416926889 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.5483731849 + "score":0.1552666429 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.5 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.1618648119 + "score":0.020551822 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.4104839109 + "score":0.1292684598 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.2266738862 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.4315390742 + "score":0.0744822177 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", - "task":"translation_from", - "metric":"bleu", - "score":0.1880331404 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", - "task":"translation_from", - "metric":"chrf", - "score":0.4234748209 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", - "task":"translation_to", - "metric":"bleu", - "score":0.1517877566 + "score":0.9 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", - "task":"translation_to", - "metric":"chrf", - "score":0.423956163 + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", - "task":"classification", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"cs", + "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.4 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.2430984589 + "score":0.0527597248 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.4969060141 + "score":0.3026154166 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.1699224465 + "score":0.0777044688 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.3964402252 + "score":0.3081482084 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.1 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.5 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.2907230812 + "score":0.1237340737 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5148223626 + "score":0.3601104142 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.3473636391 + "score":0.1371705946 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.5442574441 + "score":0.4120757797 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"el", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.2 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"el", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.3577876868 + "score":0.0837672025 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.5943423055 + "score":0.2648038016 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.5344280565 + "score":0.0885028071 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.7084649844 + "score":0.2007646735 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.2 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.452427177 + "score":0.3548422361 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.6525566656 + "score":0.460765953 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.5467976399 + "score":0.4690424472 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.7780833183 + "score":0.6788013861 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.3 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3554331718 + "score":0.1169662945 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5997743406 + "score":0.3242693179 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3847830842 + "score":0.2556403143 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6191109047 + "score":0.4583071754 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", "score":0.4 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.2579194729 + "score":0.0271486292 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5351839762 + "score":0.2182731449 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.1571676635 + "score":0.0526574176 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.4046770996 + "score":0.2424108963 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fil", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", "score":0.4 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.3771043132 + "score":0.0762125847 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.5835797455 + "score":0.2228549327 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.3564426025 + "score":0.0269063649 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.6107274367 + "score":0.2401408344 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.3 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.6 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.2846092378 + "score":0.0839707225 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5655970541 + "score":0.3074010094 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.5192984544 + "score":0.2478840637 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.7020040834 + "score":0.4205657928 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0290727628 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1841843114 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0523495621 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1231670583 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"gu", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.4 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.2796934014 + "score":0.0005257422 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5155626456 + "score":0.0721265952 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.1979202011 + "score":0.000262224 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4528880823 + "score":0.0118348356 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"ha", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.6 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1595296755 + "score":0.0318398305 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.3859356797 + "score":0.1834830244 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.171830216 + "score":0.0320718253 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.4608354018 + "score":0.1032515167 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", "score":0.5 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3520691191 + "score":0.1989310744 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6035990708 + "score":0.408792844 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3987037224 + "score":0.2107266229 }, { - "model":"google\/gemma-3-27b-it", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.6195037668 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3377417704 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5674360496 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3534620252 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6680177029 + "score":0.3722535388 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.7 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.3356485456 + "score":0.0223204074 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.5684527887 + "score":0.1959765545 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.3627134123 + "score":0.022115131 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.6050822949 + "score":0.1882969266 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.2481856237 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.5180749152 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.242508046 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.4046420215 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3019627022 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5133980923 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2316517545 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5189963647 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hu", + "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.2 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.2692189197 + "score":0.1149995432 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5290912174 + "score":0.3052316233 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.2869741566 + "score":0.1017437337 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.5072256514 + "score":0.2651695911 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", "task":"mmlu", "metric":"accuracy", - "score":0.3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2172591082 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.478962626 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2169046229 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3151387909 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.5 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.2809005667 + "score":0.1251179936 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5466717628 + "score":0.3078536626 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.2287455417 + "score":0.1049757961 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.4915489263 + "score":0.338086632 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3395095603 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5877742809 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2222923122 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4572688692 + "score":0.7 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ms", - "task":"classification", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ig", + "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.6 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.3794800258 + "score":0.0185191424 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.6256125923 + "score":0.1790132896 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.3593747877 + "score":0.0151653031 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.664135376 + "score":0.0537338226 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.251920694 + "score":0.0341024751 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.4662583176 + "score":0.2126115238 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.1647980206 + "score":0.0221151729 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.4166796691 + "score":0.1431429685 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"it", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.4 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.0417850648 + "score":0.1041933329 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.2509675066 + "score":0.3064701129 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.0312813941 + "score":0.1299185029 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.2886309955 + "score":0.3570513672 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2613495089 + "score":0.1170990874 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5009335042 + "score":0.3281623219 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.1648455996 + "score":0.1166577127 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.3943041737 + "score":0.2303280443 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.4164890636 + "score":0.0192945074 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.6375470445 + "score":0.2015068169 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.4166823661 + "score":0.045857499 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.575314128 + "score":0.1778848232 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.2913506513 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.5431985912 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.3723742743 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.5891983505 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.340245547 + "score":0.0278653757 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.5681284927 + "score":0.2309769046 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.4702737577 + "score":0.0264488684 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.6903236014 + "score":0.1618433519 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.7 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.2862936285 + "score":0.0187368299 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.5264436928 + "score":0.210610547 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.4800957551 + "score":0.0070803381 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.6618495803 + "score":0.0602951272 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.2365858071 + "score":0.0343738545 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.4722212406 + "score":0.1971697601 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.2251623508 + "score":0.012430185 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.4159341653 + "score":0.0969965616 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.2 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.268709657 + "score":0.1011791445 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.5306834056 + "score":0.2665626277 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.3395981599 + "score":0.0674482283 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.6130756934 + "score":0.1439352867 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.2563448403 + "score":0.0333812973 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.5007966916 + "score":0.2140071833 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.2405135195 + "score":0.013803565 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.5564984925 + "score":0.0856760144 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.2787922254 + "score":0.0857349903 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.5420797212 + "score":0.2682295704 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.259866454 + "score":0.0363984536 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.48543634 + "score":0.2133514375 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.2400131449 + "score":0.0831966089 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.4851690277 + "score":0.3252283455 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.383380628 + "score":0.0100264548 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.5430720239 + "score":0.2049643183 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", "score":0.4 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.2757340333 + "score":0.0402775114 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5244536559 + "score":0.2132968488 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.3185578758 + "score":0.0178624704 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5765088485 + "score":0.1584836987 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2595582459 + "score":0.044306682 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5043992681 + "score":0.2110608123 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.2142625601 + "score":0.0101250707 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.429749938 + "score":0.1446641679 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2595944841 + "score":0.0250471784 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5081810113 + "score":0.2097577846 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2601189518 + "score":0.034382114 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.5225655991 + "score":0.2211758055 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.2 }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.2279880384 + "score":0.120023798 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.4835933272 + "score":0.3039131897 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.3478085621 + "score":0.1137229069 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.5968604742 + "score":0.3446031673 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.246042863 + "score":0.1101780964 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.4917114856 + "score":0.2424045636 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.1017188886 + "score":0.0971253665 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wuu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.1707828137 + "score":0.1223804901 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.2124709579 + "score":0.0522706053 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.4811646042 + "score":0.2509451803 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.1392232 + "score":0.0404811569 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.2205120991 + "score":0.2098515398 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.2 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", "score":0.5 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.1900086584 + "score":0.1127735687 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.4895930442 + "score":0.3096427976 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.2395565562 + "score":0.1171995651 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.3237759485 + "score":0.39693057 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", "score":0.2 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.0135029462 + "score":0.0249203424 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.1510010912 + "score":0.183758763 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.0033288372 + "score":0.0148302605 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"am", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.0389705109 + "score":0.1329930306 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"om", "task":"classification", "metric":"accuracy", + "score":0.4 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", "score":0.7 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.0592251547 + "score":0.0171568718 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.2921276604 + "score":0.1561109456 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.0366276845 + "score":0.0097264241 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"apc", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.2393327958 + "score":0.0452833915 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.0837265107 + "score":0.0554840251 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.3012065838 + "score":0.1538079363 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.1120670716 + "score":0.0033288372 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.2771296913 + "score":0.036508675 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.0290259599 + "score":0.3055395757 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.2238098591 + "score":0.4480585816 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.0597935462 + "score":0.2165906221 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"arz", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.2388670431 + "score":0.3271537328 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"az", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"az", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.0148972561 + "score":0.1017362354 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"az", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.2336350172 + "score":0.2782010079 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"az", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.0047574121 + "score":0.1041302213 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"az", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.1922357185 + "score":0.2865629267 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.0581882104 + "score":0.1031395116 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.2702416532 + "score":0.3223915745 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.0562052656 + "score":0.1194174782 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bho", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.2181774858 + "score":0.3618255907 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.1 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", "score":0.3 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.021858254 + "score":0.0901332073 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.2327499821 + "score":0.2638668804 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.0253088472 + "score":0.1408494847 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.1918662187 + "score":0.2546101322 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.1 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.5 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.1784955678 + "score":0.0826481083 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.4008799371 + "score":0.2913230821 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1782663616 + "score":0.1808682916 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.4070825897 + "score":0.3815777762 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.2797104835 + "score":0.0012309971 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.4601471921 + "score":0.0385987025 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.3392404298 + "score":0.0093358773 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.5518674496 + "score":0.0457261214 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.0448599501 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.1691371082 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.0527194634 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.3 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.1682956348 + "score":0.0187725283 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.3705606944 + "score":0.1451005114 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.1595479626 + "score":0.0072043177 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.4040956812 + "score":0.0622904587 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.6 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.0333586544 + "score":0.015192186 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.2582740293 + "score":0.1562018554 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.0187498765 + "score":0.0146518601 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.2265924477 + "score":0.0664358997 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fil", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fil", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fil", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.1122756663 + "score":0.0168598973 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fil", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.3654994366 + "score":0.1350682776 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fil", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.0565617503 + "score":0.0192034206 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fil", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.2914640343 + "score":0.1607323446 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.1362099506 + "score":0.0538059584 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.4039646029 + "score":0.2453781212 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.2151785904 + "score":0.0917605905 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.4309035319 + "score":0.2668905804 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"gu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"gu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.0426900866 + "score":0.0217870696 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"gu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.2179546047 + "score":0.2165031068 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"gu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.0232938459 + "score":0.0464674805 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"gu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.2007105106 + "score":0.2235940604 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ha", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":0.3 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ha", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ha", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ha", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.0254280801 + "score":0.1007032416 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ha", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.1890793851 + "score":0.2719560518 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ha", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.0144953008 + "score":0.1266242057 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ha", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.1884647114 + "score":0.3334538145 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.3 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.1658307051 + "score":0.0422003709 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.3676480008 + "score":0.253591842 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.1711676323 + "score":0.0280729387 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.360371738 + "score":0.1884927612 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", "score":0.7 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.1399603895 + "score":0.0366379898 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.3604113675 + "score":0.1847934746 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.1312450274 + "score":0.0141355453 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.3988827234 + "score":0.1724636201 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.2 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0992729275 + "score":0.1550101498 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.3331935567 + "score":0.3623113506 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.1507170285 + "score":0.1217984824 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"it", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.4062498972 + "score":0.2801870917 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", "score":0.7 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mgsm", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.0606788965 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.1688995018 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.0007119113 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.0386741345 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"th", + "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"th", + "task":"mgsm", "metric":"accuracy", "score":0.1 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.1222242366 + "score":0.0853746951 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.3415186168 + "score":0.3009803927 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.1607198845 + "score":0.0676677726 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.2706371796 + "score":0.2051763344 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.1 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.0550016522 + "score":0.0118399471 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.2468917982 + "score":0.0818929883 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.017690474 + "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.2536001746 + "score":0.0131103824 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.0397152583 + "score":0.1075252941 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.2037873099 + "score":0.2810155518 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.0137546968 + "score":0.0683323294 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"kn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.1710566423 + "score":0.2657241512 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ko", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ko", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ko", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.0564413481 + "score":0.0921333598 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ko", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.3212656259 + "score":0.2640680177 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ko", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.0674768387 + "score":0.1042804602 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ko", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.1657544717 + "score":0.257176459 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.0532822129 + "score":0.0453126073 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.2301007371 + "score":0.1567880475 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.022639121 + "score":0.027790575 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ml", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.175884413 + "score":0.0855724163 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.7 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0411296617 + "score":0.096255918 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.2442292695 + "score":0.2490196736 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.0482775033 + "score":0.0759551519 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.2211003771 + "score":0.2765897266 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.1375979502 + "score":0.030810794 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.3518293272 + "score":0.1804383237 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.1462646527 + "score":0.0151653031 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ms", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.3886405702 + "score":0.0766086067 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.1 + "score":0.1578714698 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.2238699363 + "score":0.3784433754 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.1 + "score":0.1713340477 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"my", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.1606469353 + "score":0.3260532752 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.8 }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"om", + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.0127402107 + "score":0.0354904515 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.1651498064 + "score":0.1880266806 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.0088808864 + "score":0.0178986288 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"om", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.1702476721 + "score":0.0724032398 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.0366762006 + "score":0.0482308543 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.1697470704 + "score":0.2087387992 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.0190635247 + "score":0.0574307954 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"or", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.1343627089 + "score":0.1098000711 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.2292007848 + "score":0.0118398272 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.3716655897 + "score":0.1505828307 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.2126702079 + "score":0.008719744 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.3248815955 + "score":0.056668863 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.1085949014 + "score":0.0200324188 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.3346783911 + "score":0.1553578618 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.1676106101 + "score":0.0095466427 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pl", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.3907504991 + "score":0.0491504248 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":0.7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.1013445398 + "score":0.0513648793 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.3063125264 + "score":0.2577830867 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.2231857524 + "score":0.119690435 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.4401829864 + "score":0.1721639976 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.2 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.5 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.1005466956 + "score":0.0821079546 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.3356518748 + "score":0.3164863838 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.1363185356 + "score":0.1265931852 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.3769111636 + "score":0.1793067232 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.6 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.0441421075 + "score":0.0115347204 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.1739314177 + "score":0.1485833844 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.0182129294 + "score":0.0093856962 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sd", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.119134604 + "score":0.0608458885 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":0.5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.0510060878 + "score":0.1520421573 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.2132741272 + "score":0.3707336059 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.0089146903 + "score":0.0325845731 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.2314109768 + "score":0.1866364833 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"af", "task":"classification", "metric":"accuracy", - "score":0.3 + "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.0303451125 + "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.1748071119 + "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.0076177075 + "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.1986647775 + "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.7 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ak", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", "score":0.1 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.1096331511 + "score":0.049235994 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.2888090685 + "score":0.1875704973 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.1206114883 + "score":0.0203716729 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.2597106436 + "score":0.1964052359 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.3 + "score":0.1 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.0382115226 + "score":0.0457848104 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.2562543067 + "score":0.1635760551 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.0125933293 + "score":0.0043114209 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.1659603426 + "score":0.0733956093 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", - "score":0.6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.0907273605 + "score":0.0844832543 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.2666411269 + "score":0.2899357726 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.0495223383 + "score":0.0202296618 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.276468397 + "score":0.1170466993 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.0891185343 + "score":0.1314009634 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.281793335 + "score":0.3827163755 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.0799576366 + "score":0.0953897712 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.2661903898 + "score":0.2894343613 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.0287030985 + "score":0.0542604747 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.2124751899 + "score":0.2839533373 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.0040250398 + "score":0.0103488851 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.1706379305 + "score":0.1022931459 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1005104859 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.3241333261 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.0397410561 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.1986373033 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"as", + "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.4 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.1389065496 + "score":0.0370753847 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.3708687542 + "score":0.2466649661 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.1661316612 + "score":0.0104943059 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.354399593 + "score":0.1703228075 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.0973024735 + "score":0.1181763987 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.3076531166 + "score":0.3010924314 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.0161682999 + "score":0.0774366468 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.0635837055 + "score":0.232244564 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"az", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.1043191943 + "score":0.0700327695 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.3414129274 + "score":0.2793919522 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.0651436117 + "score":0.04780178 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.1002582276 + "score":0.1986318307 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":0.7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":1.0 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.1133138775 + "score":0.0761832692 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.3754190494 + "score":0.3293090829 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.1672636279 + "score":0.0940299872 }, { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.232325354 + "score":0.3022965125 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"am", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.1203676158 + "score":0.1421502617 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.3241911739 + "score":0.3249063292 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.0165994228 + "score":0.044984749 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.1058904177 + "score":0.1531327249 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.2332719546 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.4924788322 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.1544598614 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.403814105 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.5 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2609114367 + "score":0.1016298945 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5167379854 + "score":0.2980803254 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.1932802581 + "score":0.0978160022 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.4648835751 + "score":0.2190252958 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.1966421011 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.4161867731 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.1531147508 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.3635575685 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.130005692 + "score":0.0784827192 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.3815764307 + "score":0.3301673127 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.136654027 + "score":0.0942154389 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.3809883299 + "score":0.3318581823 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.2451140745 + "score":0.0227564483 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.4883780153 + "score":0.1618637003 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.1334730215 + "score":0.0041151275 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.363000921 + "score":0.052321141 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.1 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.1938367121 + "score":0.1376994092 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.4674774016 + "score":0.3446006208 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.2073541352 + "score":0.1126650404 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.4438396219 + "score":0.3592815418 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-nemo", "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-nemo", "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-nemo", "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-nemo", "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.2685056004 + "score":0.1786073211 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-nemo", "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.506818165 + "score":0.418923403 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-nemo", "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.3801657831 + "score":0.1529904036 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-nemo", "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.6056477234 + "score":0.4257110482 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"el", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"el", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.1 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"el", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.2216031518 + "score":0.0881428767 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.4429472312 + "score":0.2731602409 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.3322887566 + "score":0.1667346071 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.5824514758 + "score":0.3197259125 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.1 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.1640783778 + "score":0.3166864072 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.434749516 + "score":0.5483508218 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.3126220052 + "score":0.4404172544 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.6038883227 + "score":0.7231001513 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2147534918 + "score":0.1298121807 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.4874495537 + "score":0.3403579227 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.094833194 + "score":0.3743863952 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.3292486732 + "score":0.5971283997 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.3074477197 + "score":0.1016894588 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5168064726 + "score":0.3636401028 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.2380541489 + "score":0.1695199459 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.552589393 + "score":0.3986853323 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2261588318 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4944996319 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4626001556 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6614963779 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.3 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.2250377214 + "score":0.1164300835 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.4688956519 + "score":0.3215620941 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.1515937263 + "score":0.1452350029 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.4251249067 + "score":0.4128118494 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.1 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.0957125553 + "score":0.1078563354 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.3135046613 + "score":0.3207926618 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.1387309388 + "score":0.3659011486 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.383923158 + "score":0.580998869 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.3316295853 + "score":0.0208055886 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.5594083443 + "score":0.1775856129 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.3598049012 + "score":0.0303702553 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.5828568956 + "score":0.1647346597 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"gu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.2236143729 + "score":0.0897802232 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.4912948296 + "score":0.3334021167 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.2910526755 + "score":0.0546926081 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.6005590773 + "score":0.2631919591 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ha", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.3 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.2150043089 + "score":0.038636598 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.4693148389 + "score":0.1770095402 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.2998342329 + "score":0.0050909961 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.5545377546 + "score":0.1811657432 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.2131020144 + "score":0.1271878224 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.4845704057 + "score":0.3698932868 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.1446650781 + "score":0.1324625901 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.2292145443 + "score":0.3233634009 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.1840709267 + "score":0.0809118708 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.4042090141 + "score":0.2537010038 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.1902389614 + "score":0.022242601 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.4796942089 + "score":0.2086622767 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.1797031918 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.446466319 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.1846339038 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.4220658756 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hu", + "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.1932392069 + "score":0.1216394809 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.4204852284 + "score":0.4062520998 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.0476115004 + "score":0.1488006127 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.0790735292 + "score":0.3814897068 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2670990652 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5220692033 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1981851908 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4555314776 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", + "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.2152417217 + "score":0.1489627056 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4578207034 + "score":0.4172638299 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1654073391 + "score":0.2008824981 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.3941079443 + "score":0.5185852751 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.2763114217 + "score":0.0505138835 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.5353874356 + "score":0.1914888261 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.3315044625 + "score":0.0070198993 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.6241092077 + "score":0.1690394526 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.2083780287 + "score":0.0982399037 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.4466015977 + "score":0.2845447958 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.0879797246 + "score":0.0238061486 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.3441521948 + "score":0.2070418144 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.1 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.0206783974 + "score":0.1148524922 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.2005424268 + "score":0.3722842281 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.0171071488 + "score":0.250138544 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.239253642 + "score":0.5338430631 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.1677012885 + "score":0.1169165949 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.4316686173 + "score":0.3638899173 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.1202133569 + "score":0.1330552123 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.3816566526 + "score":0.2685952079 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.1891048622 + "score":0.0823011221 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4238091524 + "score":0.2825939861 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2086330089 + "score":0.0327082346 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.364326938 + "score":0.2319054893 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.1998083747 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.4667760664 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.3336132898 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.5541703282 + "score":0.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2256776552 + "score":0.044667859 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.4793769886 + "score":0.2691000298 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.3320822339 + "score":0.0732644907 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.6132478102 + "score":0.3296633392 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.1 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.1730354472 + "score":0.0353609299 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.454951133 + "score":0.1909025949 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.3073459183 + "score":0.0077167113 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.554890569 + "score":0.1386174808 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.1343511225 + "score":0.1165534681 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.385804118 + "score":0.3877914341 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.0662090824 + "score":0.1033665849 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-nemo", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.3030628402 + "score":0.3638806009 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.1798653655 + "score":0.1314926141 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.4290347271 + "score":0.3540405018 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.1709237193 + "score":0.1705869429 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.522080463 + "score":0.2612780395 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.1405088565 + "score":0.0158033007 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.4088204523 + "score":0.1802186885 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.2360333676 + "score":0.004737288 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-nemo", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.5038093602 + "score":0.1665989397 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.2507091988 + "score":0.0968803629 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.5067409185 + "score":0.3271235347 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.2998213366 + "score":0.0742021289 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.5112516267 + "score":0.1811100359 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.2022308722 + "score":0.0830883828 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.4620737135 + "score":0.2590209016 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.2592698778 + "score":0.0473984845 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4253112122 + "score":0.2714023791 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.2231619401 + "score":0.0436065244 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.4653230255 + "score":0.1616079019 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.2701457179 + "score":0.0321839146 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5043061571 + "score":0.2872152251 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.194871957 + "score":0.1039755938 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.4838690709 + "score":0.3670583743 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.1908512613 + "score":0.0490353313 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.3855814375 + "score":0.3016997477 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.177513842 + "score":0.1016737952 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.386230097 + "score":0.3529445259 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2544813414 + "score":0.0980137705 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.4948262917 + "score":0.3076980329 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.2003733128 + "score":0.2051934522 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.4613442635 + "score":0.4174861616 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.3326058501 + "score":0.1030714956 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.5496097026 + "score":0.3069420156 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.1538409962 + "score":0.1062506996 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.4398974306 + "score":0.3311804385 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.0373503953 + "score":0.0661499319 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.074080246 + "score":0.2408635082 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.174955946 + "score":0.1305087747 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.4554476081 + "score":0.336550146 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.1400846872 + "score":0.0829900967 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.1809201358 + "score":0.3039678683 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.2 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.1869648376 + "score":0.1166543201 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.4664675781 + "score":0.3031041679 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.1696786467 + "score":0.200304354 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.2325846099 + "score":0.4780661009 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.0265108253 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.1166554461 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0293332904 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.1849240696 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"om", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.6 }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"am", + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.1375609672 + "score":0.0177577979 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.3710873948 + "score":0.1411822431 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.0526682247 + "score":0.0101970078 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-nemo", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.1185738392 + "score":0.1613941454 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.2624553878 + "score":0.0446786865 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.5118695802 + "score":0.1562050743 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.2175864677 + "score":0.0022538162 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-nemo", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.4641969296 + "score":0.0960982382 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2766513185 + "score":0.3158857772 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.5528193738 + "score":0.5109022919 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.3371708551 + "score":0.2903521386 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.5607841978 + "score":0.4758823803 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2374604323 + "score":0.1198559998 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.4585263555 + "score":0.3492711529 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.2300327193 + "score":0.2480316528 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.43482663 + "score":0.4488014348 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.1767618659 + "score":0.1398701241 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4088166263 + "score":0.3034565852 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.1381246624 + "score":0.3460979115 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.3730280956 + "score":0.5835851988 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.2731033294 + "score":0.1130151873 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5159041397 + "score":0.3818050844 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.2075901182 + "score":0.1838222494 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.4086862509 + "score":0.416344125 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.1 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2623045124 + "score":0.0947682488 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.512895511 + "score":0.3259777135 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.3328087961 + "score":0.1796274314 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.5013967236 + "score":0.4360781177 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-nemo", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-nemo", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-nemo", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.2 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-nemo", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.3059254014 + "score":0.0300958323 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-nemo", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.5403551155 + "score":0.2021438397 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-nemo", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.4588037752 + "score":0.0097834933 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-nemo", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.6692431614 + "score":0.1744531846 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mgsm", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.0299661217 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.204544657 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.0009238366 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.0843772457 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"si", + "task":"classification", "metric":"accuracy", "score":0.2 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.2 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.5486108614 + "score":0.031724087 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.6873139374 + "score":0.16451202 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.691450825 + "score":0.0046124791 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.8407064328 + "score":0.1085913002 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.3021494986 + "score":0.017437495 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.5604145602 + "score":0.142035614 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.3865320679 + "score":0.0146532378 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.6126903448 + "score":0.1923028552 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.3 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.3383579693 + "score":0.0516240546 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.5641679075 + "score":0.153428686 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.2069613925 + "score":0.0121002424 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.4288746449 + "score":0.1697462625 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.3771163962 + "score":0.115711536 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.5827777548 + "score":0.3597872407 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.3225619014 + "score":0.1694354423 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.5830090459 + "score":0.4167060912 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2924853239 + "score":0.0407632458 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.5462367408 + "score":0.2238900502 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.4963618411 + "score":0.0714251247 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.682573515 + "score":0.2764333203 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3220032872 + "score":0.2208693059 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.537784261 + "score":0.4679683611 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.2206953431 + "score":0.3234795754 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.4990640113 + "score":0.5608576982 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.2 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.3 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.1527043255 + "score":0.0669163701 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.4074071592 + "score":0.2784916366 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.1567942198 + "score":0.0633186191 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.4125213011 + "score":0.3074668268 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.3914590212 + "score":0.0917433239 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.6128431348 + "score":0.3851148557 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.4189427376 + "score":0.1299606269 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.6262550579 + "score":0.3428948363 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.290274553 + "score":0.1471870965 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5143960108 + "score":0.3392441061 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.3789023659 + "score":0.2060450795 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6751523776 + "score":0.3717773766 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.296179579 + "score":0.0594528699 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.5259369403 + "score":0.1988219607 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.3187240753 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.5786749514 + "score":0.1247215313 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"th", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.3306727326 + "score":0.1079848157 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5648258387 + "score":0.2801778291 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.262512317 + "score":0.1131365873 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-nemo", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.4036795798 + "score":0.2713637811 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.1 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.2593989014 + "score":0.0118794667 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.4825732152 + "score":0.1249552242 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.2177203514 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.452576603 + "score":0.0507921341 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.2155836452 + "score":0.1097631082 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.4583181839 + "score":0.3352988316 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.2468017951 + "score":0.0795019275 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-nemo", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.4734415865 + "score":0.2884455353 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.2276258723 + "score":0.0837893895 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.4577745447 + "score":0.2809963487 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.3046437152 + "score":0.2215012201 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.3825631739 + "score":0.4551853935 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-nemo", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.4 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-nemo", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.271926141 + "score":0.0345153294 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-nemo", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.5318057054 + "score":0.1364890072 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-nemo", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.2579782083 + "score":0.0012941396 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-nemo", + "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.4806502272 + "score":0.1092334478 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.2987546297 + "score":0.0522713846 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.526361525 + "score":0.3192866676 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.1515083487 + "score":0.0868686952 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.4332812085 + "score":0.2859772299 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.3458633411 + "score":0.0689558305 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.5703964991 + "score":0.22853185 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.4050410338 + "score":0.0415402981 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-nemo", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.6535211779 + "score":0.2227329297 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2598947984 + "score":0.0649160569 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4881220333 + "score":0.2830042558 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.2015903544 + "score":0.0350138164 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.4513077936 + "score":0.2206802597 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.4 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.024472012 + "score":0.0588767323 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.2143061298 + "score":0.2123528181 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.0100859589 + "score":0.0134096062 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.2528047704 + "score":0.1594472691 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.285587224 + "score":0.0908263331 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.5216659729 + "score":0.3394219762 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1281773816 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-nemo", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.3720376754 + "score":0.0645497034 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.4479091606 + "score":0.0478741208 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.6272058507 + "score":0.1576256072 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.4155919737 + "score":0.0235106256 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.5685427433 + "score":0.1852540612 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", + "score":0.4 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0235724586 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.1570768217 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0152437624 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.1214492647 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2568309796 + "score":0.0740063452 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.5058927884 + "score":0.2757375638 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.3323405641 + "score":0.0872564614 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-nemo", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.5569354008 + "score":0.1427963743 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.3183331223 + "score":0.0992800287 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5559144449 + "score":0.324429867 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.4500659682 + "score":0.09185491 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.6761551234 + "score":0.1769207611 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.1 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.2051262499 + "score":0.0494841031 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.4837372958 + "score":0.1999996494 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.3699194641 + "score":0.0196415161 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.5770913921 + "score":0.1910730769 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.2666171334 + "score":0.2867784698 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.4765001737 + "score":0.5037863792 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.1168753501 + "score":0.2421610142 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.3522716786 + "score":0.4148106883 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"af", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.2983575506 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.5283269577 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.3087303367 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.6028401745 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.2210855899 + "score":0.0787707917 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.4616487061 + "score":0.218746848 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.2867265678 + "score":0.0187531501 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.5646798034 + "score":0.1112723085 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.3 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.2 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.357367421 + "score":0.0462314764 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.5659157865 + "score":0.1434072436 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.3515649071 + "score":0.0132821079 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.5645706042 + "score":0.0456848091 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.2422208114 + "score":0.2054466179 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.4745802383 + "score":0.4635698598 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.3118363896 + "score":0.2513408047 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.4892437324 + "score":0.5078766295 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2772171859 + "score":0.278999196 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5118206984 + "score":0.5072892325 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3271066365 + "score":0.335915232 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.5803660329 + "score":0.5453940527 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.2584265792 + "score":0.1240264763 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.5020697076 + "score":0.3914345538 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.2624388601 + "score":0.1767788852 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.4452300688 + "score":0.3838449247 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.2640324297 + "score":0.2249154291 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.5196545965 + "score":0.4283700551 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.2748329219 + "score":0.2483121176 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.5341998684 + "score":0.4611825726 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"as", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.2872551102 + "score":0.1368466985 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.5360250569 + "score":0.3988973343 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.3575088107 + "score":0.0337104112 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.5879974234 + "score":0.2239889311 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.2174626032 + "score":0.2836423323 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.4686565248 + "score":0.4827693819 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.0941401506 + "score":0.1511392088 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.1690248565 + "score":0.3858872623 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"az", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.2098595469 + "score":0.1923090312 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.4603190119 + "score":0.3973361244 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.0831701767 + "score":0.1398741741 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.2065328404 + "score":0.4023712427 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 + "model":"mistralai\/mistral-saba", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.1262645615 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", + "model":"mistralai\/mistral-saba", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.389349888 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.164496362 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.42344822 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"bho", + "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.2619931658 + "score":0.2246336129 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.5251502482 + "score":0.4406538597 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.2725475868 + "score":0.1192868334 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.3148065512 + "score":0.3094007011 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.6 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"am", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.0584274365 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.2032749366 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.0680986525 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.1147231502 + "score":0.2557484343 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.3942588381 + "score":0.4816174974 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.1208986545 + "score":0.336565743 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.329533412 + "score":0.500099888 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.2166642565 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.4531623464 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.2433592841 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.3890038008 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.1494352369 + "score":0.1502069597 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.3928912763 + "score":0.365503748 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.212669524 + "score":0.1518861892 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.4040671507 + "score":0.3795025844 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.090597898 + "score":0.0716255326 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.3141862136 + "score":0.2354287318 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.0583354997 + "score":0.0016024995 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.2066334095 + "score":0.1289259809 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.1762047672 + "score":0.2895060168 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.4472079773 + "score":0.5088283599 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.1314817408 + "score":0.3502843148 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.3114200678 + "score":0.5851011111 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1749870589 + "score":0.33652498 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.3959743603 + "score":0.5394051209 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.1992458221 + "score":0.4124704223 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.3995820747 + "score":0.6500309258 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"el", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"el", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"el", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.2301502689 + "score":0.2440848305 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.4644650793 + "score":0.4482066389 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.2921772734 + "score":0.3683187834 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.4951314188 + "score":0.5300499022 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"en", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"en", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.4124666467 + "score":0.4669071745 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.582315662 + "score":0.6351301458 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.5519762012 + "score":0.5813419207 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.7446058172 + "score":0.8065247071 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"es", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2337331881 + "score":0.293714449 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.4523774022 + "score":0.4892518335 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.2045157252 + "score":0.3400529578 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.4389018917 + "score":0.6054518089 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.1671223511 + "score":0.2392739698 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.4271635079 + "score":0.4813714407 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.0972518606 + "score":0.2321648572 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.3009816209 + "score":0.4166342577 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.2033697572 + "score":0.2811212879 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.4085758597 + "score":0.4244631944 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.1337024916 + "score":0.2282664087 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.3569658269 + "score":0.5153269959 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.2381890937 + "score":0.2548863763 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.4806457757 + "score":0.5181895957 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.3213357404 + "score":0.4309072933 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.5096591733 + "score":0.6122951839 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0365190298 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1781763265 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0417146562 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.0914072868 + }, + { + "model":"mistralai\/mistral-saba", "bcp_47":"gu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.168790959 + "score":0.266641943 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.3588726594 + "score":0.4689143537 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.0998466384 + "score":0.1714078748 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.3089879911 + "score":0.45528413 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.0730728705 + "score":0.0639113657 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.2880810134 + "score":0.1707631202 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.032930228 + "score":0.0551968249 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.1836595807 + "score":0.165412979 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"hi", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.2951777856 + "score":0.3708164771 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.5193991656 + "score":0.5780452995 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.332068694 + "score":0.3889665973 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.5232846835 + "score":0.5940361548 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.1717243204 + "score":0.261843766 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.4178336488 + "score":0.4806474097 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.1865357446 + "score":0.0995040783 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.429444403 + "score":0.3935925698 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-saba", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-saba", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.1826323546 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-saba", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.4460216478 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-saba", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.1650968642 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-saba", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.3244010767 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-saba", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1933631076 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4686346426 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1629637627 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.265082494 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"jv", - "task":"classification", + { + "model":"mistralai\/mistral-saba", + "bcp_47":"hu", + "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.0726508623 + "score":0.218205371 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.3051851212 + "score":0.4561374245 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.1282743245 + "score":0.2523642916 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.3321469572 + "score":0.5178642158 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1401399582 + "score":0.2714445111 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.3051974688 + "score":0.5033343062 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.0942053588 + "score":0.3367134056 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.3363687748 + "score":0.6204206544 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-saba", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-saba", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-saba", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.1324044329 + "score":0.0577998278 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-saba", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.3790251178 + "score":0.184470268 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-saba", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.1547958954 + "score":0.0317976664 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-saba", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.2281907624 + "score":0.1311048104 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-saba", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-saba", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.171951865 + "score":0.097793149 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-saba", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.3835379408 + "score":0.2519860373 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-saba", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.1659756056 + "score":0.0683877466 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-saba", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.4178488097 + "score":0.255829494 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"it", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.144541816 + "score":0.26428669 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.3648764501 + "score":0.4902151754 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.1047482644 + "score":0.3239977856 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.2965277611 + "score":0.5865126635 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2497767256 + "score":0.2208745982 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.4824221555 + "score":0.4944838309 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.1854347311 + "score":0.1755723698 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.331339842 + "score":0.3733502483 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.0578909241 + "score":0.1125731148 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.2614924673 + "score":0.2778916971 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.1528509146 + "score":0.0861201622 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.347684852 + "score":0.3310005151 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-saba", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.6 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"om", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-saba", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.0322766368 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-saba", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.1548467965 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-saba", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.0104672499 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-saba", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.1495897529 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-saba", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-saba", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.1266427785 + "score":0.1995238484 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-saba", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.3740164648 + "score":0.4335224538 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-saba", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.0281188176 + "score":0.172304501 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-saba", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.1879339756 + "score":0.4246105774 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.3595710948 + "score":0.0572277693 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.539538196 + "score":0.2158207267 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.3110476538 + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.4964416902 + "score":0.0812368695 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-saba", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-saba", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.1791082561 + "score":0.2415284955 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-saba", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.4315704667 + "score":0.4761318508 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-saba", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.1725231395 + "score":0.2506029382 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-saba", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.3476924531 + "score":0.4820610024 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2073899393 + "score":0.2390442925 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.4691838054 + "score":0.4660486517 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.1956364634 + "score":0.1889249825 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.3100521945 + "score":0.314876296 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.1671614266 + "score":0.0673075407 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.4422244829 + "score":0.2078406147 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.1893614933 + "score":0.0194519734 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.4605763082 + "score":0.1011298866 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.1191725522 + "score":0.2922121087 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.3048062246 + "score":0.5037938788 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.0235301378 + "score":0.2113094586 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-saba", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.1674956015 + "score":0.4865126178 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.153544279 + "score":0.2362297066 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.381670314 + "score":0.4746614882 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.0470329064 + "score":0.108285746 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.3516233998 + "score":0.3934483867 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.116565827 + "score":0.0484302224 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.3259696821 + "score":0.2222317379 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.1799251119 + "score":0.0220530515 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-saba", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.4422961909 + "score":0.2506994166 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2177874056 + "score":0.2936668736 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.4228885108 + "score":0.4940538554 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.2215396728 + "score":0.1686173343 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-saba", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.4514044695 + "score":0.4033123912 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.1077250531 + "score":0.3097940645 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.3466580166 + "score":0.5304242832 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2151882368 + "score":0.2168719994 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.3617567446 + "score":0.4555868419 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.1246699911 + "score":0.3030951939 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.3740469363 + "score":0.5195567075 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.1584629952 + "score":0.3655435175 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-saba", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.3608300472 + "score":0.6292737269 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"my", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.142024307 + "score":0.20731642 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.3925303581 + "score":0.414222781 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.13811776 + "score":0.0884087592 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.3521086255 + "score":0.2678188556 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.1642228534 + "score":0.2746115511 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.3736012886 + "score":0.5022730585 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.055748564 + "score":0.1969099003 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-saba", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.2468016347 + "score":0.4481037581 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.1850447544 + "score":0.23536401 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.4328029287 + "score":0.4943928771 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.2262846976 + "score":0.3235114454 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.3523271738 + "score":0.5875209718 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.1255642972 + "score":0.0495608632 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.3734878168 + "score":0.2045968087 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.0067248884 + "score":0.0294620037 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-saba", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.0887426693 + "score":0.1680044731 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.1143976046 + "score":0.0200154664 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.3625809543 + "score":0.1606834413 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.1277032117 + "score":0.0044245595 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-saba", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.2179430009 + "score":0.1054952984 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"or", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.2115579648 + "score":0.1001204869 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.4634573062 + "score":0.2836152046 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.1903215556 + "score":0.0445164582 }, { - "model":"meta-llama\/llama-3.1-8b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.2429625775 + "score":0.2337334441 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.0534412445 + "score":0.4077844252 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.1423750168 + "score":0.6076754833 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.0522677244 + "score":0.4459003493 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.1317238701 + "score":0.5840266721 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"pl", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.8 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.2148436144 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.0061046998 + "score":0.4670207413 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.048395385 + "score":0.2898684366 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.1624192131 + "score":0.525989117 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.7 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.0365328036 + "score":0.264907032 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.1594198405 + "score":0.4939362461 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.089863703 + "score":0.4563355662 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.2290725718 + "score":0.6843169799 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.1186358374 + "score":0.258396409 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.2861009841 + "score":0.4912290692 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.0659782167 + "score":0.4713411152 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.1219080159 + "score":0.6517904546 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.8 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.0197183104 + "score":0.1955652432 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.1858500787 + "score":0.4654058492 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1372446539 + "score":0.2591393679 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.1970334371 + "score":0.4936043335 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.6 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.0225723033 + "score":0.0562734776 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.2128372612 + "score":0.212197658 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.0900337367 + "score":0.0314083234 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.2030113676 - }, - { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.5 + "score":0.1492631083 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"hi", - "task":"mmlu", + "model":"mistralai\/mistral-saba", + "bcp_47":"sd", + "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-saba", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.1275394125 + "score":0.0890242869 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-saba", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.2249822055 + "score":0.2507686532 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-saba", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.1164104087 + "score":0.0 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-saba", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.2255759794 + "score":0.0807676975 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.4 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.0396919548 + "score":0.0084519738 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.193498077 + "score":0.151041875 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.0463130015 + "score":0.0056901248 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-saba", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.147263979 + "score":0.100130068 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-saba", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-saba", + "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", "score":0.0 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-saba", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.5 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-saba", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.0196332917 + "score":0.0267041676 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-saba", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.0615297483 + "score":0.1555601794 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-saba", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.002077843 + "score":0.018455165 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-saba", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.0228028425 + "score":0.1280213362 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.0192847454 + "score":0.0558797598 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.1432000045 + "score":0.1672295272 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.0179600462 + "score":0.0266323434 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-saba", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.1308378956 + "score":0.1344659816 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.0103335448 + "score":0.2165549669 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.0394434629 + "score":0.4902121608 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.0093410183 + "score":0.2493024035 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-saba", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.0758287765 + "score":0.4391116426 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2072883352 + "score":0.1532491466 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.2238489904 + "score":0.3330342559 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.2192906863 + "score":0.0762662838 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.330676254 + "score":0.2740420072 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.8 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.0506856305 + "score":0.2875970952 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.2502940387 + "score":0.4962250868 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.0801303171 + "score":0.382073635 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.1635269784 + "score":0.6293993104 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.6 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.050859162 + "score":0.0845702794 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.2002283949 + "score":0.2799479817 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.0199756762 + "score":0.1327606257 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.1055944134 + "score":0.4346855791 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.4 - }, - { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.001996605 + "score":0.2777158956 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.1999016804 + "score":0.4958635491 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.0453589274 + "score":0.2970897235 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.1405820992 + "score":0.5394670378 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.5 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.1115247653 + "score":0.3805998732 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.1296059134 + "score":0.5566308844 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.1480453761 + "score":0.3811390337 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.2690624141 + "score":0.5895281984 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.0114376329 + "score":0.0685553777 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.0233475148 + "score":0.2845942287 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.0385720696 + "score":0.0371906835 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.1423687352 + "score":0.1797173863 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"th", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"vi", - "task":"mmlu", + "model":"mistralai\/mistral-saba", + "bcp_47":"th", + "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.0697220351 + "score":0.2079294904 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.1874677848 + "score":0.4320631023 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.135086862 + "score":0.2456928253 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-saba", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.2446182636 + "score":0.3989628007 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.2 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", + "model":"mistralai\/mistral-saba", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0154825384 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.1339811483 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", "score":0.0 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0278445131 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.0190942897 + "score":0.2699521486 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.1108498114 + "score":0.478882362 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.2654978305 }, { - "model":"meta-llama\/llama-3.2-1b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-saba", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.0294450289 + "score":0.5487755246 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"am", - "task":"mgsm", + "model":"mistralai\/mistral-saba", + "bcp_47":"uk", + "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"am", - "task":"mmlu", + "model":"mistralai\/mistral-saba", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2622533206 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.4831695415 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3002613398 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.4834403722 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"umb", + "task":"classification", "metric":"accuracy", "score":0.4 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.1452228976 + "score":0.0279025481 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.3699202818 + "score":0.0843438607 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.0630164833 + "score":0.0224775292 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"am", + "model":"mistralai\/mistral-saba", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1057554869 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2469989894 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.4943114536 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2844546137 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.1755172285 + "score":0.477210689 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2933386948 + "score":0.1727284585 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.5447211689 + "score":0.4250344787 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.2166524228 + "score":0.1817744295 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"apc", + "model":"mistralai\/mistral-saba", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.4496497227 + "score":0.4656549066 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2997360932 + "score":0.2373174322 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.552448295 + "score":0.4521152897 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.2837522278 + "score":0.2962197342 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.5150814494 + "score":0.544285644 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.1936957127 + "score":0.0678548322 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.4274660929 + "score":0.1995976377 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.2338775014 + "score":0.0410008999 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", + "model":"mistralai\/mistral-saba", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.4546098648 + "score":0.1410775666 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.1576463626 + "score":0.1807443545 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.3910005157 + "score":0.4282740606 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1690495289 + "score":0.1030562145 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"az", + "model":"mistralai\/mistral-saba", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.3930640761 + "score":0.1694260317 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.3061950313 + "score":0.0705660888 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.5535821276 + "score":0.1999709116 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.1811004213 + "score":0.005606616 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bho", + "model":"mistralai\/mistral-saba", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.3534531968 + "score":0.0791302868 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.2 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.2646772038 + "score":0.0146140319 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.5157826791 + "score":0.1546761245 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.331255344 + "score":0.0066574272 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.5093924414 + "score":0.0720455741 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.3129672706 + "score":0.1686505919 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.5456543979 + "score":0.4407452421 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.4852409005 + "score":0.1561257665 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", + "model":"mistralai\/mistral-saba", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.6908376394 + "score":0.2413348415 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.5510215557 + "score":0.2391219094 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.6909834226 + "score":0.4993680631 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.6679215449 + "score":0.2546682455 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.823262947 + "score":0.3131256963 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.1 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.3139331841 + "score":0.0409238482 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.5454623234 + "score":0.1759269251 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.3561290923 + "score":0.040396663 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-saba", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.599796306 + "score":0.1387970813 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2175149129 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4527759686 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1124798847 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.2758121544 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"af", + "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.3069040556 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.5327832177 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.2185015953 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.4264089038 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.3745780882 + "score":0.0499477269 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.5785175063 + "score":0.161467557 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.2904415478 + "score":0.0061206295 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.5908280404 + "score":0.1175310591 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.4 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.1 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.2 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.2963449909 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.5544997379 + "score":0.0682401612 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.5091700689 + "score":0.0028802187 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.690320784 + "score":0.0506386945 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.295613677 + "score":0.1505032551 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.5221513183 + "score":0.4086092545 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.1697878702 + "score":0.1882561377 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.4619303787 + "score":0.3814760125 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mgsm", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", + "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.1878091774 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.4280751788 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.2100749947 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.3864616183 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ary", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.1704488365 + "score":0.093266394 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.4403441536 + "score":0.311215609 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.1466885285 + "score":0.1039989943 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.4179596519 + "score":0.2907556954 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.385731086 + "score":0.1020177653 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.6034244629 + "score":0.3338664094 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.357812342 + "score":0.1064323135 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.5894721809 + "score":0.3080022567 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"as", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.3143630083 + "score":0.0979045908 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.5621460006 + "score":0.3174950846 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.3372718385 + "score":0.0117862293 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.6543894215 + "score":0.1847940791 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.2934122255 + "score":0.2573591397 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.5393871714 + "score":0.4309874046 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.3100077394 + "score":0.0851522303 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.5714730187 + "score":0.2284178182 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"az", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.284322765 + "score":0.0818689903 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.5304019177 + "score":0.2636451344 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.2212745751 + "score":0.0746797577 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.355950114 + "score":0.3147526037 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"be", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.2779520489 + "score":0.0989261118 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.5022141687 + "score":0.3536619814 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.2476437073 + "score":0.1746758677 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.4805413308 + "score":0.3604842775 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.2379701997 + "score":0.1908291186 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.4807978998 + "score":0.4048132215 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.2068140088 + "score":0.0320570973 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.4615143451 + "score":0.1921106676 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.2508944927 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.4998320266 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.210142355 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.3127505848 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2566290969 + "score":0.1554049163 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5196341734 + "score":0.3557989532 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.2701878605 + "score":0.2229681692 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.4964908212 + "score":0.3722031872 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.3224419544 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.5606155155 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.1663847917 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.4383662593 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.3103894957 + "score":0.2130798288 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.5854645421 + "score":0.3738480621 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.3913336262 + "score":0.1589337472 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.6467989318 + "score":0.4334432444 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.2392486974 + "score":0.037561576 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.4920626101 + "score":0.1318206471 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.2130836675 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.4622075168 + "score":0.1217595648 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.0356994946 + "score":0.210101514 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.2438060785 + "score":0.4301134482 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.0183592041 + "score":0.362165784 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.3076327609 + "score":0.5625700474 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.2403245803 + "score":0.2836619572 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5023246313 + "score":0.5189927538 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.1415388613 + "score":0.3481484827 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.4055113288 + "score":0.5703115876 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.4519562833 + "score":0.2310257801 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.6328740374 + "score":0.4431650209 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.3918546765 + "score":0.2968021074 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.551810658 + "score":0.4607855577 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.2474554181 + "score":0.4358717425 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.490135462 + "score":0.6055153523 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.3387973296 + "score":0.6254747881 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.5550868321 + "score":0.7898596498 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", + "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3065957195 + "score":0.2211802733 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5567333989 + "score":0.4673850088 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.4450524918 + "score":0.3141247128 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6712742861 + "score":0.5664089061 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.2184907643 + "score":0.1378005544 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.4824691404 + "score":0.3634410941 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.3406091079 + "score":0.1662541754 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.5689518318 + "score":0.3656154799 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fil", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.2363136631 + "score":0.2598161419 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.4724628618 + "score":0.4673557809 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.1012580658 + "score":0.2352273865 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.3226539734 + "score":0.5423645035 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.2373393477 + "score":0.2637885864 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5017230165 + "score":0.50661739 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.2334583695 + "score":0.3898419239 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.5603415221 + "score":0.5983170279 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.2147204762 + "score":0.030172991 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.4649686586 + "score":0.1791853335 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.2451735521 + "score":0.0012644122 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.5352886898 + "score":0.0541809315 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"gu", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.3767393472 + "score":0.1879687767 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5870286691 + "score":0.3575768224 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.3415510311 + "score":0.1193068232 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.5592933672 + "score":0.3258076554 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", "score":0.1 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.2385233061 + "score":0.0424529379 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.4987667959 + "score":0.205545596 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.3202315883 + "score":0.0315047557 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.4748886274 + "score":0.1862281652 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.2786347493 + "score":0.2931006661 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.5143010521 + "score":0.5117710763 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3361615644 + "score":0.3454885653 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.5732166456 + "score":0.5632832845 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.252958993 + "score":0.1423442665 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.5053979802 + "score":0.3938289086 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.2339821201 + "score":0.0479071398 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.425306622 + "score":0.2390532358 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.236632122 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.4793696196 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.265421135 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.5116987882 + "score":0.0 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hu", + "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.2721498467 + "score":0.1466679693 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5200799335 + "score":0.4020226017 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.3613736416 + "score":0.2296543368 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.5866656133 + "score":0.4623290904 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1844305556 + "score":0.1846129963 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4417239043 + "score":0.4218789485 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1248600823 + "score":0.2363785743 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.1650750126 + "score":0.5715726858 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.2018552397 + "score":0.042005649 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.4546838419 + "score":0.1704312564 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.1477972133 + "score":0.0060037968 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.238559837 + "score":0.1052387436 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.2259180607 + "score":0.1206947602 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.5258178103 + "score":0.2893596175 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.2474954475 + "score":0.0376635554 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.2841722148 + "score":0.2154020665 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"it", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.278050095 + "score":0.203133363 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5030892659 + "score":0.4421827582 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.2056413876 + "score":0.2636104621 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.319475702 + "score":0.5093890816 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"apc", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"apc", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3412628716 + "score":0.1660483895 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"apc", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.6168944847 + "score":0.4317128373 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"apc", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.2079777284 + "score":0.2448276505 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"apc", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.4737326062 + "score":0.4102738917 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.3288891576 + "score":0.1159703103 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.560493221 + "score":0.3116167676 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.3370289388 + "score":0.0803083214 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5616376735 + "score":0.3001867634 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.2820784803 + "score":0.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.5005600008 + "score":0.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.1762767818 + "score":0.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.3980584269 + "score":0.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"az", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"az", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2078798411 + "score":0.1346426707 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"az", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.4443945632 + "score":0.3961827686 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"az", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.1864199422 + "score":0.138703676 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"az", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.4220840798 + "score":0.4106570721 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.2239129937 + "score":0.0501718274 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.4981762083 + "score":0.2070022512 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.1952639614 + "score":0.0014765966 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.40510597 + "score":0.0534187009 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.3130233588 + "score":0.1342281856 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.5569163893 + "score":0.3526105747 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.3322667951 + "score":0.146553268 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.5140240989 + "score":0.3291051456 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.386239845 + "score":0.1737342381 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.6110300223 + "score":0.4232883693 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.4508475568 + "score":0.2383832092 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.6653203029 + "score":0.33001113 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.5649266234 + "score":0.0707102369 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.7240609445 + "score":0.2324042355 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.6160790992 + "score":0.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.8133281991 + "score":0.1164466909 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.3152773331 + "score":0.2572289084 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.5548531112 + "score":0.5125685183 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.3335962816 + "score":0.1223672825 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.5859881472 + "score":0.3023512099 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.2974755741 + "score":0.2098940087 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.548510072 + "score":0.443017936 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.198877694 + "score":0.0762167285 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4016676481 + "score":0.2552721118 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.3394346908 + "score":0.0777950532 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5772205685 + "score":0.2573049595 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.2961737536 + "score":0.0666322315 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5732830973 + "score":0.3626993592 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.3174175523 + "score":0.2059798463 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5682518332 + "score":0.4231363675 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.5173973527 + "score":0.2059172406 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.7056428374 + "score":0.4148312305 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.336179684 + "score":0.2216993022 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5448761462 + "score":0.4221894818 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.1255076156 + "score":0.1386303624 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.4301109075 + "score":0.3369477219 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.2176466652 + "score":0.2392636803 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.4472887488 + "score":0.4545241599 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.2048605344 + "score":0.3632780792 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.4547067722 + "score":0.6254141203 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.3796955055 + "score":0.0217828279 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.6056742688 + "score":0.144054989 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.382370623 + "score":0.0351771663 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.5922578575 + "score":0.2287244941 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.2523550022 + "score":0.1464596557 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5458277736 + "score":0.3564056311 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.3774331947 + "score":0.1517063855 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.6486159416 + "score":0.4352500122 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2923994901 + "score":0.2230448991 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5447705341 + "score":0.4584787016 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.4037821428 + "score":0.2531295878 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.6296260979 + "score":0.5302964071 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.4 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.3130983776 + "score":0.0696320569 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.5536124921 + "score":0.2331307278 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.3266051607 + "score":0.0252073886 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.4444671407 + "score":0.1703033014 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.3146151088 + "score":0.0276939955 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.5434123174 + "score":0.1837469296 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.3068652176 + "score":0.0160221908 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.5696595268 + "score":0.2144565152 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.273765965 + "score":0.083347512 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.5541955864 + "score":0.2190646209 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.2689874625 + "score":0.0679191643 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.5150630417 + "score":0.2873941526 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2599758467 + "score":0.3647734864 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.4915631618 + "score":0.5784168493 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.1778560135 + "score":0.3897396366 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.2969773205 + "score":0.5030239884 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.3697837131 + "score":0.1850936564 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.598263628 + "score":0.3999928464 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.2866761532 + "score":0.2726874239 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.5500074549 + "score":0.4948927457 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.3125095049 + "score":0.2070601418 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5535296132 + "score":0.4601106145 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.2275791183 + "score":0.412349088 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.4569915545 + "score":0.6102742767 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ms", - "task":"mmlu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ro", + "task":"mgsm", "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.345465339 + "score":0.2142629544 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5897544047 + "score":0.4499459763 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.4313143535 + "score":0.3895465667 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ms", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.672362003 + "score":0.5708848992 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.3075903861 + "score":0.1710045162 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.578349632 + "score":0.433047449 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1897910105 + "score":0.2961144006 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"my", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.4717519215 + "score":0.5257430939 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.1 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.2 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.0536067183 + "score":0.057729338 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.2934406231 + "score":0.2177957601 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.0212136796 + "score":0.0230572611 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"om", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.3367052821 + "score":0.16449999 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.2884546263 + "score":0.0484864486 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.5474826718 + "score":0.1952223401 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.2053276951 + "score":0.0005975301 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.4215800492 + "score":0.1227717162 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.4246522462 + "score":0.0165865489 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.6364852561 + "score":0.1532087128 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.439726575 + "score":0.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.5806732389 + "score":0.1038227782 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.1 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.4 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.2708043929 + "score":0.0457227327 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.5320865131 + "score":0.2051868353 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.2827359953 + "score":0.0141586748 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.5407300006 + "score":0.1192333436 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.5 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.3451568022 + "score":0.0421597981 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.5845365036 + "score":0.1665679168 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.4582156105 + "score":0.0011074127 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.6491023878 + "score":0.1483863351 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mgsm", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sr", + "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.1814266299 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.4404144211 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.2821064012 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.492442613 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"su", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2567420946 + "score":0.1500059372 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.5061211552 + "score":0.385325025 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.4025875747 + "score":0.0190556256 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.6083538055 + "score":0.201727165 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3060556532 + "score":0.2063172621 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5236224481 + "score":0.4245629061 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.2303677631 + "score":0.2871245672 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.4550652237 + "score":0.5575367366 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.3425500041 + "score":0.1106429776 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5680420054 + "score":0.3246322884 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.2980763573 + "score":0.1586725311 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.5924685945 + "score":0.4486820539 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2473591284 + "score":0.0861902503 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5382867852 + "score":0.2737902674 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.3068229029 + "score":0.1910130331 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.5637367471 + "score":0.4159297845 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"te", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.6 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.4 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.3462186566 + "score":0.2631133201 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.6055817314 + "score":0.504043761 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.3822149946 + "score":0.2496114121 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.5783618359 + "score":0.4707696336 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.2652851581 + "score":0.0528559098 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.5278626321 + "score":0.2067746551 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.3718263092 + "score":0.0275980154 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.5255136074 + "score":0.1880963665 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"th", + "task":"mgsm", "metric":"accuracy", "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.2978237586 + "score":0.1533969949 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5152360665 + "score":0.3718867563 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.3447394658 + "score":0.2858310833 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.5850690403 + "score":0.4323129392 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.3 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.253549974 + "score":0.0536249593 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.5235064606 + "score":0.190207113 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.2484556869 + "score":0.0 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.429442787 + "score":0.0308454815 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.2701010494 + "score":0.1776801562 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5241051692 + "score":0.4036600408 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.3181656056 + "score":0.2335702423 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"uz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.5907906511 + "score":0.4992388897 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.2670924013 + "score":0.1788374332 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.5198891912 + "score":0.4671147568 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.3597766713 + "score":0.2348003993 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.6081806669 + "score":0.4786253942 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.2 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.2653942694 + "score":0.0150184554 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.4893923691 + "score":0.1309010161 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.1157826458 + "score":0.0010839978 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"wuu", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.1765005496 + "score":0.0719045729 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.2204568545 + "score":0.1854021136 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.4894165826 + "score":0.4258067424 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.1569463992 + "score":0.1388133394 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.232785021 + "score":0.3685419874 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2703289724 + "score":0.1877241389 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.5473102513 + "score":0.4060591516 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.317769874 + "score":0.1165785177 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.3676906362 + "score":0.4074870036 }, { - "model":"microsoft\/phi-4", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":0.4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"microsoft\/phi-4", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.0476085337 + "score":0.2204611632 }, { - "model":"microsoft\/phi-4", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.205897506 + "score":0.4366931331 }, { - "model":"microsoft\/phi-4", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.0110136998 + "score":0.2957932526 }, { - "model":"microsoft\/phi-4", - "bcp_47":"am", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.0688367427 + "score":0.5127606293 }, { - "model":"microsoft\/phi-4", - "bcp_47":"apc", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"apc", - "task":"translation_from", - "metric":"bleu", - "score":0.0927070911 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"apc", - "task":"translation_from", - "metric":"chrf", - "score":0.3300356171 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"apc", - "task":"translation_to", - "metric":"bleu", - "score":0.1909661669 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"apc", - "task":"translation_to", - "metric":"chrf", - "score":0.4391780261 + "score":0.6 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wo", + "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.1 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.1548779531 + "score":0.0530966299 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.3887963415 + "score":0.183305815 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.268706305 + "score":0.0017326575 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.4959259833 + "score":0.1225688999 }, { - "model":"microsoft\/phi-4", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.106947781 + "score":0.1059358827 }, { - "model":"microsoft\/phi-4", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.3169488071 + "score":0.3291955196 }, { - "model":"microsoft\/phi-4", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1479958867 + "score":0.0116334446 }, { - "model":"microsoft\/phi-4", - "bcp_47":"arz", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.3761797641 + "score":0.0643182856 }, { - "model":"microsoft\/phi-4", - "bcp_47":"az", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"az", - "task":"translation_from", - "metric":"bleu", - "score":0.0298418752 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"az", - "task":"translation_from", - "metric":"chrf", - "score":0.2580610439 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"az", - "task":"translation_to", - "metric":"bleu", - "score":0.041095966 + "score":0.8 }, { - "model":"microsoft\/phi-4", - "bcp_47":"az", - "task":"translation_to", - "metric":"chrf", - "score":0.2930729253 + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bho", - "task":"classification", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"xh", + "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.1 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.1569501012 + "score":0.0665909516 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.4039420627 + "score":0.2275785677 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.1151073387 + "score":0.0230978994 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bho", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.3126448605 + "score":0.1160311087 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.1 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.2 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.095240952 + "score":0.0299390587 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.3840548344 + "score":0.1474455997 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.1876367188 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.4310988737 + "score":0.0919549448 }, { - "model":"microsoft\/phi-4", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2546126219 + "score":0.1503741808 }, { - "model":"microsoft\/phi-4", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.4840060449 + "score":0.3985964495 }, { - "model":"microsoft\/phi-4", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.3171866034 + "score":0.1755859315 }, { - "model":"microsoft\/phi-4", - "bcp_47":"de", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.5752285995 + "score":0.2407951689 }, { - "model":"microsoft\/phi-4", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"microsoft\/phi-4", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.3642023499 + "score":0.1386896901 }, { - "model":"microsoft\/phi-4", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5697992815 + "score":0.413832278 }, { - "model":"microsoft\/phi-4", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.4959810553 + "score":0.2503925306 }, { - "model":"microsoft\/phi-4", - "bcp_47":"en", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.7232313255 + "score":0.3045084897 }, { - "model":"microsoft\/phi-4", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"microsoft\/phi-4", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.1 }, { - "model":"microsoft\/phi-4", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"microsoft\/phi-4", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.1732534835 + "score":0.0365820579 }, { - "model":"microsoft\/phi-4", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.4434970776 + "score":0.1964572986 }, { - "model":"microsoft\/phi-4", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.3605235101 + "score":0.0044447951 }, { - "model":"microsoft\/phi-4", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.5849733787 + "score":0.1846817289 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", + "model":"openai\/gpt-4.1", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2428195445 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.5030866734 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2620151049 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4506581715 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"af", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.0868573088 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.3068232268 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.0883262705 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.3294670602 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.1921595243 + "score":0.0873196299 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.4381909531 + "score":0.2791620733 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.2102834142 + "score":0.0938455414 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.503934087 + "score":0.3566262434 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"am", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.1763652726 + "score":0.1724572981 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.4428784232 + "score":0.4396154177 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.3772793055 + "score":0.151364721 }, { - "model":"microsoft\/phi-4", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.5820724576 + "score":0.2888758833 }, { - "model":"microsoft\/phi-4", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.1581139234 + "score":0.2635134498 }, { - "model":"microsoft\/phi-4", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.3992847318 + "score":0.5460096147 }, { - "model":"microsoft\/phi-4", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.1006122628 + "score":0.2693884383 }, { - "model":"microsoft\/phi-4", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.3529986856 + "score":0.5166212712 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.0310807341 + "score":0.2499610519 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.2470826922 + "score":0.5318854927 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.0634023566 + "score":0.4039353928 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.2955476351 + "score":0.6016089011 }, { - "model":"microsoft\/phi-4", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.2788689746 + "score":0.1580325965 }, { - "model":"microsoft\/phi-4", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.5417455941 + "score":0.4452763225 }, { - "model":"microsoft\/phi-4", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.2369610218 + "score":0.1755215463 }, { - "model":"microsoft\/phi-4", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.3765795877 + "score":0.4247958024 }, { - "model":"microsoft\/phi-4", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.0855471394 + "score":0.2186059158 }, { - "model":"microsoft\/phi-4", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.3720740561 + "score":0.4527608912 }, { - "model":"microsoft\/phi-4", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.284365864 + "score":0.2928280563 }, { - "model":"microsoft\/phi-4", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.589202199 + "score":0.4822967505 }, { - "model":"microsoft\/phi-4", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"as", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.1849581121 + "score":0.2425216718 }, { - "model":"microsoft\/phi-4", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.4562979327 + "score":0.4831264986 }, { - "model":"microsoft\/phi-4", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.2591551222 + "score":0.1377054899 }, { - "model":"microsoft\/phi-4", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.5311194854 + "score":0.3411255917 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 + "model":"openai\/gpt-4.1", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3603859441 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", + "model":"openai\/gpt-4.1", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5684805903 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1408898772 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.3872495567 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"az", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.1462066826 + "score":0.169544784 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.4299215293 + "score":0.4154274624 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.2371087689 + "score":0.1683183381 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.4064089202 + "score":0.4409361184 }, { - "model":"microsoft\/phi-4", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"be", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.1102793601 + "score":0.1501419666 }, { - "model":"microsoft\/phi-4", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.3718502317 + "score":0.4658338479 }, { - "model":"microsoft\/phi-4", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.0999035402 + "score":0.281865771 }, { - "model":"microsoft\/phi-4", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.3664761129 + "score":0.4773167113 }, { - "model":"microsoft\/phi-4", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.104202131 + "score":0.2591609762 }, { - "model":"microsoft\/phi-4", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.3590734072 + "score":0.5223588424 }, { - "model":"microsoft\/phi-4", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.0705324379 + "score":0.1993415983 }, { - "model":"microsoft\/phi-4", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.3025321109 + "score":0.4224866763 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.1107444823 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.3916459404 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.1649626358 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.2656552119 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.1675392326 + "score":0.2991941811 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.4161590898 + "score":0.5494978816 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.101823454 + "score":0.3244067885 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.3124446375 + "score":0.5219822848 }, { - "model":"microsoft\/phi-4", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.1012625471 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.3580813711 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.0891010327 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.3158325956 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.1211248924 + "score":0.4271806928 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.389246098 + "score":0.6413850627 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.2367123999 + "score":0.3702054313 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.5273473365 + "score":0.6183232461 }, { - "model":"microsoft\/phi-4", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.1262296798 + "score":0.2020995263 }, { - "model":"microsoft\/phi-4", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.3480250641 + "score":0.4532917138 }, { - "model":"microsoft\/phi-4", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.104091386 + "score":0.1831160509 }, { - "model":"microsoft\/phi-4", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.3135377948 + "score":0.4629805537 }, { - "model":"microsoft\/phi-4", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"microsoft\/phi-4", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"microsoft\/phi-4", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.0103766134 + "score":0.3165458461 }, { - "model":"microsoft\/phi-4", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.1821363344 + "score":0.571286718 }, { - "model":"microsoft\/phi-4", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.0003856632 + "score":0.3923540946 }, { - "model":"microsoft\/phi-4", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.0985339751 + "score":0.6004577577 }, { - "model":"microsoft\/phi-4", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"de", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1279029727 + "score":0.3466410252 }, { - "model":"microsoft\/phi-4", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.3504496172 + "score":0.5865767052 }, { - "model":"microsoft\/phi-4", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.1158076498 + "score":0.4978134672 }, { - "model":"microsoft\/phi-4", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.3583374616 + "score":0.6912703606 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"el", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.3550414512 + "score":0.308914586 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.5626107823 + "score":0.5426019264 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.2784963846 + "score":0.2768987754 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.4121299981 + "score":0.4945030297 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"en", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":1.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.1049411882 + "score":0.539334775 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.371724232 + "score":0.7031277793 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.2126550777 + "score":0.6275460309 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.4754992095 + "score":0.8258272044 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"es", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.1813353123 + "score":0.3148515413 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.4632560004 + "score":0.5634810123 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3450201321 + "score":0.4056181014 }, { - "model":"microsoft\/phi-4", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.5827805827 + "score":0.6446334193 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", "score":0.8 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.164734586 + "score":0.3057972645 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.4400610126 + "score":0.5437056078 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.2884407046 + "score":0.2134083705 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.5338739518 + "score":0.4531825072 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.0476641683 + "score":0.3908134626 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.1691869095 + "score":0.6127114899 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.0111247819 + "score":0.3246807458 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.151377306 + "score":0.5949140146 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sw", + "model":"openai\/gpt-4.1", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sw", + "model":"openai\/gpt-4.1", + "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sw", + "model":"openai\/gpt-4.1", + "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sw", + "model":"openai\/gpt-4.1", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.1325294802 + "score":0.3184811644 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sw", + "model":"openai\/gpt-4.1", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.4051925402 + "score":0.5751428267 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sw", + "model":"openai\/gpt-4.1", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.1631216823 + "score":0.5082124359 }, { - "model":"microsoft\/phi-4", - "bcp_47":"sw", + "model":"openai\/gpt-4.1", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.4696161488 + "score":0.6953832529 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ta", + "model":"openai\/gpt-4.1", + "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ta", + "model":"openai\/gpt-4.1", + "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.1338729952 + "score":0.0379690036 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ta", + "model":"openai\/gpt-4.1", + "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.3640492116 + "score":0.2450412363 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ta", + "model":"openai\/gpt-4.1", + "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.1115670494 + "score":0.0600253056 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ta", + "model":"openai\/gpt-4.1", + "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.4303510763 + "score":0.2209496659 }, { - "model":"microsoft\/phi-4", - "bcp_47":"te", + "model":"openai\/gpt-4.1", + "bcp_47":"gu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", + "model":"openai\/gpt-4.1", + "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.2374723306 + "score":0.2877530662 }, { - "model":"microsoft\/phi-4", - "bcp_47":"te", + "model":"openai\/gpt-4.1", + "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.4675485501 + "score":0.5281343849 }, { - "model":"microsoft\/phi-4", - "bcp_47":"te", + "model":"openai\/gpt-4.1", + "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.2528444882 + "score":0.1402688672 }, { - "model":"microsoft\/phi-4", - "bcp_47":"te", + "model":"openai\/gpt-4.1", + "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4794045124 + "score":0.4396874045 }, { - "model":"microsoft\/phi-4", - "bcp_47":"th", + "model":"openai\/gpt-4.1", + "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"th", + "model":"openai\/gpt-4.1", + "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", "score":0.7 }, { - "model":"microsoft\/phi-4", - "bcp_47":"th", + "model":"openai\/gpt-4.1", + "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1140490825 + "score":0.2003303143 }, { - "model":"microsoft\/phi-4", - "bcp_47":"th", + "model":"openai\/gpt-4.1", + "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.3668015685 + "score":0.4279958144 }, { - "model":"microsoft\/phi-4", - "bcp_47":"th", + "model":"openai\/gpt-4.1", + "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.1317498141 + "score":0.2428342826 }, { - "model":"microsoft\/phi-4", - "bcp_47":"th", + "model":"openai\/gpt-4.1", + "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.2770372268 + "score":0.5208238431 }, { - "model":"microsoft\/phi-4", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.1209396556 + "score":0.3556331675 }, { - "model":"microsoft\/phi-4", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.3409074931 + "score":0.5802678717 }, { - "model":"microsoft\/phi-4", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.270580586 + "score":0.38273354 }, { - "model":"microsoft\/phi-4", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.537606561 + "score":0.6044055498 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.1155003818 + "score":0.2441042617 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.3250077925 + "score":0.509051591 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.1195513435 + "score":0.1488771793 }, { - "model":"microsoft\/phi-4", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.3158904676 + "score":0.3979048506 }, { - "model":"microsoft\/phi-4", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.0676473408 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.2672641675 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.0166808106 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.2361978954 + "score":0.0 }, { - "model":"microsoft\/phi-4", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", + "model":"openai\/gpt-4.1", + "bcp_47":"hu", + "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"microsoft\/phi-4", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.1452425625 + "score":0.2781326859 }, { - "model":"microsoft\/phi-4", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.3941195385 + "score":0.5567082198 }, { - "model":"microsoft\/phi-4", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.2680553268 + "score":0.3429728329 }, { - "model":"microsoft\/phi-4", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.5055559664 + "score":0.6056687314 }, { - "model":"microsoft\/phi-4", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.0721904827 + "score":0.3462344182 }, { - "model":"microsoft\/phi-4", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.3322122834 + "score":0.5958151457 }, { - "model":"microsoft\/phi-4", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.0963078281 + "score":0.3538211232 }, { - "model":"microsoft\/phi-4", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.1506583582 + "score":0.6387367985 }, { - "model":"microsoft\/phi-4", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.1360263411 + "score":0.1914060382 }, { - "model":"microsoft\/phi-4", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.4135302369 + "score":0.4768796669 }, { - "model":"microsoft\/phi-4", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.1427052583 + "score":0.1949774059 }, { - "model":"microsoft\/phi-4", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.2190638456 + "score":0.4716938743 }, { - "model":"microsoft\/phi-4", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.1516445239 + "score":0.2651265931 }, { - "model":"microsoft\/phi-4", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.4517979691 + "score":0.4942111299 }, { - "model":"microsoft\/phi-4", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.2058198052 + "score":0.1732257355 }, { - "model":"microsoft\/phi-4", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.2799124898 + "score":0.4781715485 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":1.0 }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"am", + { + "model":"openai\/gpt-4.1", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.7 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.0143438883 + "score":0.3009538263 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.0651139855 + "score":0.5501601568 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.3493795467 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.0145699741 + "score":0.6074911227 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.1077126314 + "score":0.2184952439 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.3303312588 + "score":0.5137071093 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.0568249639 + "score":0.2956671283 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.1985159581 + "score":0.4548120956 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.1428907436 + "score":0.3245483021 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.3107041775 + "score":0.5653097878 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.1849770017 + "score":0.2393376297 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.2932088535 + "score":0.5786070517 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.021812522 + "score":0.0 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.1700035697 + "score":0.0 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.0687018163 + "score":0.0 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.213092048 + "score":0.0 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.0805820584 + "score":0.2332022845 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.2555758551 + "score":0.5054273222 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.0296286693 + "score":0.3295494284 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.1319853113 + "score":0.5830629495 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.0459721625 + "score":0.2813089854 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.2229551601 + "score":0.5573839136 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.0233985631 + "score":0.1797121389 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.1665184954 + "score":0.3875039113 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.0355167863 + "score":0.2681346443 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.2600874171 + "score":0.516271515 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.0323184525 + "score":0.3292637181 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.1970289791 + "score":0.5411335167 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.1237340737 + "score":0.2062159679 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.3601104142 + "score":0.4930481948 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.1371705946 + "score":0.199120471 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.4120757797 + "score":0.2986152055 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.3548422361 + "score":0.1624653517 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.460765953 + "score":0.3643510485 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.4690424472 + "score":0.0482270518 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.6788013861 + "score":0.2811541542 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.1169662945 + "score":0.3712275773 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.3242693179 + "score":0.6060872554 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.2556403143 + "score":0.2415518345 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.4583071754 + "score":0.4847424345 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.0271486292 + "score":0.3038147054 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.2182731449 + "score":0.5564897496 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.0526574176 + "score":0.1265912109 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.2424108963 + "score":0.4505477793 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.6 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.0762125847 + "score":0.2892690248 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.2228549327 + "score":0.5283814116 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.0269063649 + "score":0.2604484731 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.2401408344 + "score":0.5570920222 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.0839707225 + "score":0.3167316864 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.3074010094 + "score":0.5615256782 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.2478840637 + "score":0.2233206779 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.4205657928 + "score":0.4945538715 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.0005257422 + "score":0.2372647899 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.0721265952 + "score":0.5201689948 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.000262224 + "score":0.2837915649 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.0118348356 + "score":0.4968686069 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":0.7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.0318398305 + "score":0.3817837328 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.1834830244 + "score":0.6303019898 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.0320718253 + "score":0.4073449446 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.1032515167 + "score":0.6943366118 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.1989310744 + "score":0.3249100629 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.408792844 + "score":0.5431426981 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.2107266229 + "score":0.235732523 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.3722535388 + "score":0.5043766555 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.1251179936 + "score":0.3096041789 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.3078536626 + "score":0.5699841909 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.1049757961 + "score":0.2732360862 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.338086632 + "score":0.5138403369 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.1041933329 + "score":0.2771400437 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.3064701129 + "score":0.5234495758 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.1299185029 + "score":0.3125238973 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.3570513672 + "score":0.5924438438 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.6 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.1170990874 + "score":0.2155748492 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.3281623219 + "score":0.4825510875 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.1166577127 + "score":0.1108028659 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.2303280443 + "score":0.4669878278 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.0192945074 + "score":0.1205990098 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.2015068169 + "score":0.3774448724 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.045857499 + "score":0.0499279171 }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", + { + "model":"openai\/gpt-4.1", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.1778848232 + "score":0.3917438838 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.0343738545 + "score":0.2796086811 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.1971697601 + "score":0.5313259159 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.012430185 + "score":0.1726812539 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.0969965616 + "score":0.4298144259 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.1011791445 + "score":0.4066850608 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.2665626277 + "score":0.6424035216 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.0674482283 + "score":0.4726631876 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.1439352867 + "score":0.6063294964 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", "score":0.8 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.044306682 + "score":0.279299064 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.2110608123 + "score":0.5370393541 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.0101250707 + "score":0.3400908956 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.1446641679 + "score":0.5719220223 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.0250471784 + "score":0.3091176603 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.2097577846 + "score":0.5550502185 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.034382114 + "score":0.4520197651 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.2211758055 + "score":0.6675992003 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.120023798 + "score":0.2929157497 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.3039131897 + "score":0.5489344393 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.1137229069 + "score":0.4680709113 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.3446031673 + "score":0.656644785 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.1101780964 + "score":0.2332295676 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.2424045636 + "score":0.5393238215 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.0971253665 + "score":0.3359555862 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.1223804901 + "score":0.5768159572 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.5 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.0171568718 + "score":0.1988009754 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.1561109456 + "score":0.4678679556 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.0097264241 + "score":0.2629383296 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.0452833915 + "score":0.5460945267 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.0554840251 + "score":0.3262698326 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.1538079363 + "score":0.5582120149 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.0033288372 + "score":0.3228689165 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.036508675 + "score":0.4980199993 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.3055395757 + "score":0.2183778489 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.4480585816 + "score":0.4879608634 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.2165906221 + "score":0.2090356271 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.3271537328 + "score":0.3834363403 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.7 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.1017362354 + "score":0.1117579943 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.2782010079 + "score":0.3651910045 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.1041302213 + "score":0.1550941263 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.2865629267 + "score":0.5033416845 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.6 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.1031395116 + "score":0.2638307043 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.3223915745 + "score":0.4819229353 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.1194174782 + "score":0.184886568 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.3618255907 + "score":0.4611492374 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mgsm", + "model":"openai\/gpt-4.1", + "bcp_47":"sr", + "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", + "model":"openai\/gpt-4.1", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2842627945 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5655019867 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.3294849496 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.5361539575 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"su", + "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.0826481083 + "score":0.2389196918 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.2913230821 + "score":0.4797843722 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.1808682916 + "score":0.1891587494 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.3815777762 + "score":0.4981237511 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", "score":0.8 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.0448599501 + "score":0.2815285609 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.1691371082 + "score":0.5465800135 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.3801186069 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.0527194634 + "score":0.6436092706 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":1.0 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.7 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.0422003709 + "score":0.3118480568 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.253591842 + "score":0.546369665 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.0280729387 + "score":0.3964352653 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.1884927612 + "score":0.6509673425 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.0366379898 + "score":0.261907541 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.1847934746 + "score":0.5163685859 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.0141355453 + "score":0.2722219181 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.1724636201 + "score":0.532399617 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":1.0 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.8 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.1550101498 + "score":0.393859257 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.3623113506 + "score":0.6378203173 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.1217984824 + "score":0.3327078813 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.2801870917 + "score":0.5457177636 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.2154192376 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4696470371 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.2538014928 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.5009654989 + }, + { + "model":"openai\/gpt-4.1", "bcp_47":"th", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"th", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.0853746951 + "score":0.3143461477 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.3009803927 + "score":0.5485350923 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.0676677726 + "score":0.39778814 }, { - "model":"microsoft\/phi-4-multimodal-instruct", + "model":"openai\/gpt-4.1", "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.2051763344 + "score":0.5566425188 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.1075252941 + "score":0.1498024182 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.2810155518 + "score":0.3821120653 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.0683323294 + "score":0.0693185679 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.2657241512 + "score":0.1815602807 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.096255918 + "score":0.2731125622 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.2490196736 + "score":0.5386147699 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.0759551519 + "score":0.3357059921 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.2765897266 + "score":0.6001525874 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.030810794 + "score":0.2620427472 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.1804383237 + "score":0.5463036194 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.0151653031 + "score":0.3493974795 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.0766086067 + "score":0.5517845172 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.5 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.1578714698 + "score":0.0571388098 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.3784433754 + "score":0.2146586416 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.1713340477 + "score":0.0411925065 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1", + "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.3260532752 + "score":0.1869298599 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0482308543 + "score":0.205946158 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.2087387992 + "score":0.5021595381 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.0574307954 + "score":0.2933139984 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.1098000711 + "score":0.4825872793 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.0513648793 + "score":0.2191445081 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.2577830867 + "score":0.4863403733 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.119690435 + "score":0.2099586093 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.1721639976 + "score":0.5133143617 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.0821079546 + "score":0.2583850394 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.3164863838 + "score":0.5425702257 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.1265931852 + "score":0.418014366 }, { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.1793067232 + "score":0.6308329518 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.4 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.0457848104 + "score":0.0837728981 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.1635760551 + "score":0.3448337519 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.0043114209 + "score":0.1156898441 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"am", + "model":"openai\/gpt-4.1", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.0733956093 + "score":0.3359373421 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.0844832543 + "score":0.2145078635 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.2899357726 + "score":0.4857656934 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.0202296618 + "score":0.1355871579 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"apc", + "model":"openai\/gpt-4.1", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.1170466993 + "score":0.178819439 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"xh", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.1314009634 + "score":0.2072124604 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.3827163755 + "score":0.4729134507 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.0953897712 + "score":0.1306749519 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", + "model":"openai\/gpt-4.1", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.2894343613 + "score":0.4877811483 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.1005104859 + "score":0.1312045988 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.3241333261 + "score":0.3655601583 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.0397410561 + "score":0.1087966113 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", + "model":"openai\/gpt-4.1", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.1986373033 + "score":0.2839573446 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.0700327695 + "score":0.1766032126 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.2793919522 + "score":0.4547311313 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.04780178 + "score":0.1904214808 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"az", + "model":"openai\/gpt-4.1", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.1986318307 + "score":0.2615689123 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.1421502617 + "score":0.2192323177 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.3249063292 + "score":0.5110450766 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.044984749 + "score":0.2696611562 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bho", + "model":"openai\/gpt-4.1", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.1531327249 + "score":0.2988391516 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.6 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.1016298945 + "score":0.2825650355 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.2980803254 + "score":0.5492218755 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.0978160022 + "score":0.2611643189 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", + "model":"openai\/gpt-4.1", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.2190252958 + "score":0.5637612249 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.1786073211 + "score":0.2198316321 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.418923403 + "score":0.4708151995 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.1529904036 + "score":0.2234579509 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.4257110482 + "score":0.4401488964 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"af", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.3166864072 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.5483508218 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.4404172544 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.7231001513 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ak", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.1 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.3 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.1298121807 + "score":0.1056657743 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.3403579227 + "score":0.3249231698 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.3743863952 + "score":0.0618207736 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.5971283997 + "score":0.340632844 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"am", + "task":"mgsm", "metric":"accuracy", "score":0.5 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.1016894588 + "score":0.1521950168 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.3636401028 + "score":0.3956387285 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.1695199459 + "score":0.0953768122 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.3986853323 + "score":0.2497030659 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.1164300835 + "score":0.2413546506 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.3215620941 + "score":0.5235234652 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.1452350029 + "score":0.2271910382 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.4128118494 + "score":0.4908497482 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.1078563354 + "score":0.2566573338 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.3207926618 + "score":0.5183862763 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3659011486 + "score":0.3901123396 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.580998869 + "score":0.5771753105 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.0897802232 + "score":0.1301518556 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.3334021167 + "score":0.4290918442 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.0546926081 + "score":0.1797566847 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.2631919591 + "score":0.4271851106 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", - "score":0.5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.038636598 + "score":0.1724971212 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.1770095402 + "score":0.4012455839 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.0050909961 + "score":0.2496844101 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.1811657432 + "score":0.4720007075 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"as", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.1271878224 + "score":0.1595843783 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.3698932868 + "score":0.4348621346 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.1324625901 + "score":0.1540181476 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.3233634009 + "score":0.351822758 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.1489627056 + "score":0.2979811644 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.4172638299 + "score":0.5341221534 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.2008824981 + "score":0.2462308641 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.5185852751 + "score":0.4432887674 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"az", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.1148524922 + "score":0.1840798833 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.3722842281 + "score":0.4151816693 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.250138544 + "score":0.1349305067 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.5338430631 + "score":0.397143235 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":1.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.1169165949 + "score":0.1644448391 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.3638899173 + "score":0.4629038808 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.1330552123 + "score":0.2550498255 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.2685952079 + "score":0.4544854197 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.0823011221 + "score":0.2230536146 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.2825939861 + "score":0.499651958 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.0327082346 + "score":0.2227847146 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.2319054893 + "score":0.40695057 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.1165534681 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.3877914341 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.1033665849 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.3638806009 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.1314926141 + "score":0.2819696539 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.3540405018 + "score":0.5293077213 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.1705869429 + "score":0.3092254935 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.2612780395 + "score":0.4661357412 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.1039755938 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.3670583743 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.0490353313 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.3016997477 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.1016737952 + "score":0.365645255 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.3529445259 + "score":0.5771393179 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.0980137705 + "score":0.3274189601 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.3076980329 + "score":0.5630354446 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.2051934522 + "score":0.1379843601 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.4174861616 + "score":0.3936670775 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.1030714956 + "score":0.1018796158 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.3069420156 + "score":0.3594406238 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", "score":0.8 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.1062506996 + "score":0.2953385985 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.3311804385 + "score":0.5543620654 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.0661499319 + "score":0.342919616 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.2408635082 + "score":0.5729115023 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.0177577979 + "score":0.3052927761 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.1411822431 + "score":0.5504382993 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.0101970078 + "score":0.4246355556 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.1613941454 + "score":0.6487523813 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.0446786865 + "score":0.2853090403 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.1562050743 + "score":0.5033746216 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.0022538162 + "score":0.2976764649 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.0960982382 + "score":0.4568078793 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3158857772 + "score":0.5178458342 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5109022919 + "score":0.6792020066 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.2903521386 + "score":0.6631992536 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.4758823803 + "score":0.8257245236 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.1198559998 + "score":0.2800331904 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.3492711529 + "score":0.5328441069 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.2480316528 + "score":0.3927902573 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.4488014348 + "score":0.628791549 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.1398701241 + "score":0.274202443 }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.3034565852 + "score":0.5239221129 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.3460979115 + "score":0.144419277 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.5835851988 + "score":0.405746187 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.0947682488 + "score":0.3517517227 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.3259777135 + "score":0.5678423102 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.1796274314 + "score":0.2861570496 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.4360781177 + "score":0.567530869 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.0299661217 + "score":0.2950999056 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.204544657 + "score":0.5638983665 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.0009238366 + "score":0.5061822417 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.0843772457 + "score":0.6903823708 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.6 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.0669163701 + "score":0.0579371031 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.2784916366 + "score":0.2407036725 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.0633186191 + "score":0.0338899407 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.3074668268 + "score":0.1685773285 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"gu", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.0917433239 + "score":0.2249525185 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.3851148557 + "score":0.4726822454 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.1299606269 + "score":0.1646493878 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.3428948363 + "score":0.4071725376 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.4 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1471870965 + "score":0.2293529776 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.3392441061 + "score":0.4521332467 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.2060450795 + "score":0.2554536105 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.3717773766 + "score":0.5371463729 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"mgsm", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", + "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.6 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.1079848157 + "score":0.3531906075 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.2801778291 + "score":0.6060071382 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.1131365873 + "score":0.399293733 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.2713637811 + "score":0.6132292528 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.1097631082 + "score":0.2232750657 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.3352988316 + "score":0.4801269988 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.0795019275 + "score":0.1922860161 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.2884455353 + "score":0.4363534921 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.0522713846 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.3192866676 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.0868686952 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.2859772299 + "score":0.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.0689558305 + "score":0.2647815263 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.22853185 + "score":0.5197043469 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.0415402981 + "score":0.3268056763 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.2227329297 + "score":0.5486126608 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.0649160569 + "score":0.2559881532 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.2830042558 + "score":0.5349715693 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.0350138164 + "score":0.3900018149 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.2206802597 + "score":0.6494354052 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.0908263331 + "score":0.1469460203 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.3394219762 + "score":0.3801695829 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.1926475709 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.0645497034 + "score":0.4187626054 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.0740063452 + "score":0.1826483605 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.2757375638 + "score":0.4686350803 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.0872564614 + "score":0.1078652833 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.1427963743 + "score":0.421647984 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"it", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.0992800287 + "score":0.3047636442 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.324429867 + "score":0.5385736571 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.09185491 + "score":0.3458314466 }, { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.1769207611 + "score":0.5969984451 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":1.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.0462314764 + "score":0.2100828863 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.1434072436 + "score":0.4717405627 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.0132821079 + "score":0.2844229339 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.0456848091 + "score":0.4435245651 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.2054466179 + "score":0.2977682173 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4635698598 + "score":0.5413323701 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2513408047 + "score":0.2537598479 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5078766295 + "score":0.5629521778 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.278999196 + "score":0.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.5072892325 + "score":0.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.335915232 + "score":0.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.5453940527 + "score":0.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2249154291 + "score":0.1646050237 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.4283700551 + "score":0.4508391233 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.2483121176 + "score":0.2752297553 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.4611825726 + "score":0.5180256955 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"az", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"km", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"az", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.1923090312 + "score":0.2132140468 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"az", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.3973361244 + "score":0.5000034068 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"az", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.1398741741 + "score":0.1292151863 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"az", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.4023712427 + "score":0.3392182289 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.2246336129 + "score":0.2382712271 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.4406538597 + "score":0.4901100456 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.1192868334 + "score":0.2584591395 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.3094007011 + "score":0.4586627531 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2557484343 + "score":0.1783139223 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.4816174974 + "score":0.4481556757 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.336565743 + "score":0.3002017818 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.500099888 + "score":0.3739762238 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.33652498 + "score":0.0772118618 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.5394051209 + "score":0.2815494636 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.4124704223 + "score":0.001488949 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.6500309258 + "score":0.1588971491 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", "score":1.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.4669071745 + "score":0.3080966975 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.6351301458 + "score":0.5628489014 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.5813419207 + "score":0.2981973224 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.8065247071 + "score":0.5193764902 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.293714449 + "score":0.2802761469 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.4892518335 + "score":0.5391751615 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.3400529578 + "score":0.2042851472 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.6054518089 + "score":0.4615978684 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.2392739698 + "score":0.243797007 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.4813714407 + "score":0.4981055966 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.2321648572 + "score":0.2038296766 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.4166342577 + "score":0.5453530515 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2811212879 + "score":0.2649575888 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.4244631944 + "score":0.5072138807 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.2282664087 + "score":0.186903033 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.5153269959 + "score":0.411527522 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2548863763 + "score":0.2358876365 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5181895957 + "score":0.4961149155 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.4309072933 + "score":0.2674122275 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.6122951839 + "score":0.4442281313 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.266641943 + "score":0.3443124421 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.4689143537 + "score":0.5824988714 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.1714078748 + "score":0.3763691574 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.45528413 + "score":0.6619682382 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.0639113657 + "score":0.2596129619 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.1707631202 + "score":0.485235691 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.0551968249 + "score":0.2234699025 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.165412979 + "score":0.4866737746 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.3708164771 + "score":0.3085593402 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5780452995 + "score":0.5486177789 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.3889665973 + "score":0.2319189577 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.5940361548 + "score":0.4830752425 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2714445111 + "score":0.2639124065 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5033343062 + "score":0.5166255119 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.3367134056 + "score":0.342163716 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.6204206544 + "score":0.6089275595 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.26428669 + "score":0.158564127 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.4902151754 + "score":0.4086927045 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.3239977856 + "score":0.1237632416 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.5865126635 + "score":0.4428640995 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"om", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"om", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.4 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.2208745982 + "score":0.1266863364 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.4944838309 + "score":0.3723937215 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.1755723698 + "score":0.0507341481 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.3733502483 + "score":0.3372593565 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.1125731148 + "score":0.2495546416 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.2778916971 + "score":0.505250418 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.0861201622 + "score":0.1370990235 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.3310005151 + "score":0.4188964845 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2415284955 + "score":0.3898113091 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.4761318508 + "score":0.6349932626 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.2506029382 + "score":0.4218934881 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.4820610024 + "score":0.5699211354 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2390442925 + "score":0.2238263799 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.4660486517 + "score":0.5157447202 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.1889249825 + "score":0.3376407171 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.314876296 + "score":0.5674744623 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2936668736 + "score":0.2989764302 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4940538554 + "score":0.5575461672 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.1686173343 + "score":0.4347143661 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.4033123912 + "score":0.6526848356 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.3097940645 + "score":0.2365245444 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5304242832 + "score":0.5263187531 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.2168719994 + "score":0.4295443245 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.4555868419 + "score":0.6303158648 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.3030951939 + "score":0.2156464838 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5195567075 + "score":0.4961661832 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.3655435175 + "score":0.3525318267 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.6292737269 + "score":0.5377697887 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.20731642 + "score":0.1358779492 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.414222781 + "score":0.4047237198 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.0884087592 + "score":0.2528406351 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"my", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.2678188556 + "score":0.5425926629 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":0.7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"om", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.0200154664 + "score":0.3052635197 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.1606834413 + "score":0.5444415164 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.0044245595 + "score":0.319777613 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"om", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.1054952984 + "score":0.5070316671 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"si", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.1001204869 + "score":0.224754909 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.2836152046 + "score":0.4942892862 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.0445164582 + "score":0.1763683901 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.2337334441 + "score":0.3592673643 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.4077844252 + "score":0.0579407228 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.6076754833 + "score":0.3218620552 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.4459003493 + "score":0.1045487932 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.5840266721 + "score":0.4627951581 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.2148436144 + "score":0.2457303069 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.4670207413 + "score":0.4607096598 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.2898684366 + "score":0.2208751843 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.525989117 + "score":0.499725177 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.264907032 + "score":0.2080392025 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.4939362461 + "score":0.5029005766 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.4563355662 + "score":0.3955111551 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.6843169799 + "score":0.5840966612 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"su", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.1955652432 + "score":0.2108703792 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.4654058492 + "score":0.4463761953 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.2591393679 + "score":0.1957956536 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.4936043335 + "score":0.5109625366 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.0890242869 + "score":0.3026696791 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.2507686532 + "score":0.5540321116 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.379491342 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.0807676975 + "score":0.6341129937 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.0845702794 + "score":0.2373352462 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.2799479817 + "score":0.4812305289 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.1327606257 + "score":0.3592771753 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.4346855791 + "score":0.6196466978 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ta", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2777158956 + "score":0.2189074797 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.4958635491 + "score":0.458549356 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.2970897235 + "score":0.2096038798 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.5394670378 + "score":0.48158495 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"te", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.6 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.3805998732 + "score":0.3847076164 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5566308844 + "score":0.5961555843 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.3811390337 + "score":0.3031970309 }, { - "model":"mistralai\/mistral-saba", + "model":"openai\/gpt-4.1-mini", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.5895281984 + "score":0.4938747459 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.2079294904 + "score":0.1923337483 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.4320631023 + "score":0.4073259848 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.2456928253 + "score":0.1777393755 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.3989628007 + "score":0.4229927395 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"th", + "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.2699521486 + "score":0.1973765077 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.478882362 + "score":0.478302799 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.2654978305 + "score":0.390011731 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.5487755246 + "score":0.5192332126 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.2469989894 + "score":0.0956165324 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.4943114536 + "score":0.3010660185 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.2844546137 + "score":0.0201085128 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.477210689 + "score":0.1279466164 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.1727284585 + "score":0.3027350341 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.4250344787 + "score":0.5488245098 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.1817744295 + "score":0.3543135567 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.4656549066 + "score":0.5739783335 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.2373174322 + "score":0.2739321887 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.4521152897 + "score":0.523898319 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.2962197342 + "score":0.3702945368 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.544285644 + "score":0.5833117124 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.1807443545 + "score":0.0456473272 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.4282740606 + "score":0.1799246176 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.1030562145 + "score":0.0060102851 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.1694260317 + "score":0.0643020373 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.1686505919 + "score":0.2282243664 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.4407452421 + "score":0.4878680978 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.1561257665 + "score":0.2701355148 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.2413348415 + "score":0.4485608146 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2391219094 + "score":0.2068814622 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.4993680631 + "score":0.4820023997 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.2546682455 + "score":0.1797290418 }, { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.3131256963 + "score":0.5053214161 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":0.4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.6 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.2800966186 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.0682401612 + "score":0.5447813345 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.0028802187 + "score":0.3743034645 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"am", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.0506386945 + "score":0.5977965321 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"apc", - "task":"translation_from", - "metric":"bleu", - "score":0.1505032551 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"apc", - "task":"translation_from", - "metric":"chrf", - "score":0.4086092545 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"apc", - "task":"translation_to", - "metric":"bleu", - "score":0.1882561377 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"apc", - "task":"translation_to", - "metric":"chrf", - "score":0.3814760125 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wo", + "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.2 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.1878091774 + "score":0.0698928855 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.4280751788 + "score":0.2670199291 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.2100749947 + "score":0.0438604879 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.3864616183 + "score":0.2188199264 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.1020177653 + "score":0.169474795 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.3338664094 + "score":0.4233016879 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1064323135 + "score":0.1115736327 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.3080022567 + "score":0.1741292068 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"az", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"az", - "task":"translation_from", - "metric":"bleu", - "score":0.0818689903 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"az", - "task":"translation_from", - "metric":"chrf", - "score":0.2636451344 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"az", - "task":"translation_to", - "metric":"bleu", - "score":0.0746797577 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"az", - "task":"translation_to", - "metric":"chrf", - "score":0.3147526037 + "model":"openai\/gpt-4.1-mini", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bho", - "task":"classification", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"xh", + "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.2 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.1908291186 + "score":0.1777667306 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.4048132215 + "score":0.4381801577 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.0320570973 + "score":0.0807523022 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.1921106676 + "score":0.4027285347 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", "score":0.3 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.1554049163 + "score":0.0871363585 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.3557989532 + "score":0.3153084592 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.2229681692 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3722031872 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.0712302827 }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.266201042 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yue", + "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2836619572 + "score":0.1722143774 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.5189927538 + "score":0.451617464 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.3481484827 + "score":0.1362044502 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.5703115876 + "score":0.2472412788 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.4358717425 + "score":0.211203078 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.6055153523 + "score":0.4926704854 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.6254747881 + "score":0.2808125016 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.7898596498 + "score":0.3349070044 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.2211802733 + "score":0.1986426867 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.4673850088 + "score":0.4568960366 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.3141247128 + "score":0.228999134 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.5664089061 + "score":0.5092438205 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.1378005544 + "score":0.1996215211 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.3634410941 + "score":0.452996678 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.1662541754 + "score":0.1894542228 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.3656154799 + "score":0.4104759123 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"af", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.2598161419 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.4673557809 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.2352273865 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.5423645035 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ak", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.3 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.2637885864 + "score":0.0772997859 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.50661739 + "score":0.2795137394 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.3898419239 + "score":0.0490092548 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.5983170279 + "score":0.2793012345 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"am", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.1879687767 + "score":0.0821675771 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.3575768224 + "score":0.3261780265 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.1193068232 + "score":0.0581954137 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.3258076554 + "score":0.2133137227 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"apc", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.0424529379 + "score":0.2038935703 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.205545596 + "score":0.4744865332 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.0315047557 + "score":0.198427289 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.1862281652 + "score":0.4466553325 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2931006661 + "score":0.2230716751 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5117710763 + "score":0.4868000305 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3454885653 + "score":0.3431634646 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.5632832845 + "score":0.5539675011 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.1846129963 + "score":0.0936861 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.4218789485 + "score":0.4019740671 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.2363785743 + "score":0.1320458692 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.5715726858 + "score":0.3969132003 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.203133363 + "score":0.147678651 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.4421827582 + "score":0.3870664018 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.2636104621 + "score":0.1925682475 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.5093890816 + "score":0.424235974 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"as", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.1660483895 + "score":0.1549108661 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.4317128373 + "score":0.3657540248 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.2448276505 + "score":0.1300687711 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.4102738917 + "score":0.3850114254 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.1159703103 + "score":0.2822625676 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.3116167676 + "score":0.5120051075 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.0803083214 + "score":0.1956229389 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.3001867634 + "score":0.4165258378 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"az", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.1342281856 + "score":0.1020059939 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.3526105747 + "score":0.3685311802 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.146553268 + "score":0.1584050367 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.3291051456 + "score":0.4078207292 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.1737342381 + "score":0.129620916 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.4232883693 + "score":0.4193741335 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.2383832092 + "score":0.1911430477 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.33001113 + "score":0.423978547 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.2059798463 + "score":0.1839199068 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.4231363675 + "score":0.4589371965 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.2059172406 + "score":0.1754477624 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.4148312305 + "score":0.3729187467 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.2216993022 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.4221894818 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.1386303624 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.3369477219 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2392636803 + "score":0.2104863522 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.4545241599 + "score":0.4534437048 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.3632780792 + "score":0.2824626 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.6254141203 + "score":0.4822940799 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.0217828279 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.144054989 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.0351771663 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.2287244941 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":0.7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"om", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.0276939955 + "score":0.3067568845 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.1837469296 + "score":0.522767718 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.0160221908 + "score":0.2603548365 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.2144565152 + "score":0.5472674101 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.083347512 + "score":0.061613272 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.2190646209 + "score":0.2738044534 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.0679191643 + "score":0.0495010223 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.2873941526 + "score":0.2930209689 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.3647734864 + "score":0.2480975275 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.5784168493 + "score":0.4908345188 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.3897396366 + "score":0.2780131154 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.5030239884 + "score":0.5272272242 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1850936564 + "score":0.282506513 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.3999928464 + "score":0.5438865496 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.2726874239 + "score":0.4220387975 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.4948927457 + "score":0.6440212985 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"el", + "task":"mgsm", "metric":"accuracy", "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.2070601418 + "score":0.2138985353 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.4601106145 + "score":0.4787400928 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.412349088 + "score":0.3347502447 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.6102742767 + "score":0.5277403226 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.1710045162 + "score":0.4926163025 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.433047449 + "score":0.6598180449 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.2961144006 + "score":0.5627424753 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.5257430939 + "score":0.7654936904 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.0484864486 + "score":0.2400384539 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.1952223401 + "score":0.4846098061 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.0005975301 + "score":0.331169359 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.1227717162 + "score":0.541145091 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.7 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.1106429776 + "score":0.1934774812 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.3246322884 + "score":0.4555822394 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.1586725311 + "score":0.1515704996 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.4486820539 + "score":0.4288811212 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fil", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", "score":0.7 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.0861902503 + "score":0.3049498802 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.2737902674 + "score":0.531726813 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.1910130331 + "score":0.2572361601 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.4159297845 + "score":0.5465796366 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.6 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.2631133201 + "score":0.2245970544 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.504043761 + "score":0.4773636644 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.2496114121 + "score":0.456500631 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.4707696336 + "score":0.6519350009 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"mgsm", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0508716923 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2061725545 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.001678581 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.0842472305 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"gu", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.1533969949 + "score":0.1811700298 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.3718867563 + "score":0.4450724584 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.2858310833 + "score":0.1152635411 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4323129392 + "score":0.3751269086 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1776801562 + "score":0.1042620188 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.4036600408 + "score":0.353512414 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.2335702423 + "score":0.1697643488 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.4992388897 + "score":0.4858315893 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.1854021136 + "score":0.3100386494 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.4258067424 + "score":0.5747433617 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.1388133394 + "score":0.3858833658 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.3685419874 + "score":0.5991711103 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.1877241389 + "score":0.1533855474 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.4060591516 + "score":0.4227840042 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.1165785177 + "score":0.1131265551 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.4074870036 + "score":0.3711711494 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.2204611632 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.4366931331 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.2957932526 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.5127606293 + "score":0.0 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.1059358827 + "score":0.2089476707 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.3291955196 + "score":0.4868357652 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.0116334446 + "score":0.2953914361 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.0643182856 + "score":0.5360583303 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1503741808 + "score":0.1907075731 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.3985964495 + "score":0.4662972265 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1755859315 + "score":0.3386484563 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.2407951689 + "score":0.6376664219 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ig", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.3 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.1386896901 + "score":0.0974819198 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.413832278 + "score":0.3736857308 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.2503925306 + "score":0.170722725 }, { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.3045084897 + "score":0.4039469282 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"am", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ilo", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"am", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"am", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.1521950168 + "score":0.1538751748 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"am", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.3956387285 + "score":0.3921570735 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"am", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.0953768122 + "score":0.1222763549 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"am", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.2497030659 + "score":0.3651682861 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"it", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.2413546506 + "score":0.2389788634 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5235234652 + "score":0.4950691973 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.2271910382 + "score":0.3197810714 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"apc", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.4908497482 + "score":0.5649240218 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2566573338 + "score":0.2240038475 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5183862763 + "score":0.4860646744 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.3901123396 + "score":0.2284065848 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.5771753105 + "score":0.3753787999 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.1724971212 + "score":0.1867349669 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4012455839 + "score":0.4122967846 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2496844101 + "score":0.20591358 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.4720007075 + "score":0.5231507594 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"az", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"az", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.1840798833 + "score":0.0 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"az", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.4151816693 + "score":0.0 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"az", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.1349305067 + "score":0.0 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"az", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.397143235 + "score":0.0 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2230536146 + "score":0.1757000759 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.499651958 + "score":0.4569938635 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.2227847146 + "score":0.2608919204 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bho", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.40695057 + "score":0.495117819 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.2819696539 + "score":0.1391396286 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.5293077213 + "score":0.3419293202 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.3092254935 + "score":0.11776525 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.4661357412 + "score":0.3296737913 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.3052927761 + "score":0.1659549387 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.5504382993 + "score":0.4341818109 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.4246355556 + "score":0.1728970527 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.6487523813 + "score":0.4006604704 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.5178458342 + "score":0.1418786679 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.6792020066 + "score":0.4096096806 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.6631992536 + "score":0.2767863837 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.8257245236 + "score":0.343465352 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.2800331904 + "score":0.0557337494 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.5328441069 + "score":0.2661879916 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.3927902573 + "score":0.010496354 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.628791549 + "score":0.2072817599 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.274202443 + "score":0.2919442529 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.5239221129 + "score":0.558994569 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.144419277 + "score":0.2232843577 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.405746187 + "score":0.4785649547 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.3517517227 + "score":0.1885764001 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.5678423102 + "score":0.4905954379 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.2861570496 + "score":0.1518354017 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.567530869 + "score":0.4184448049 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.2950999056 + "score":0.2031343023 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5638983665 + "score":0.4809424331 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.5061822417 + "score":0.1531227243 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.6903823708 + "score":0.486171029 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2249525185 + "score":0.2649114053 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.4726822454 + "score":0.5258722646 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.1646493878 + "score":0.1638513843 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.4071725376 + "score":0.3671674679 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2293529776 + "score":0.1755855974 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.4521332467 + "score":0.464470709 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2554536105 + "score":0.2053629902 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.5371463729 + "score":0.4466569291 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.3531906075 + "score":0.2391713081 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.6060071382 + "score":0.5284921106 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.399293733 + "score":0.3851770392 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.6132292528 + "score":0.6778949951 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.2559881532 + "score":0.1921402736 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.5349715693 + "score":0.4286234239 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.3900018149 + "score":0.226941594 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.6494354052 + "score":0.4545167964 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", "score":0.4 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.3047636442 + "score":0.2044174225 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5385736571 + "score":0.4393220695 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.3458314466 + "score":0.204358035 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.5969984451 + "score":0.4838815717 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2100828863 + "score":0.222496921 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.4717405627 + "score":0.455228974 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.2844229339 + "score":0.2971608126 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.4435245651 + "score":0.5809601739 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2977682173 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5413323701 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2537598479 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5629521778 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ny", + "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.3 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2382712271 + "score":0.0616783152 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.4901100456 + "score":0.2486430016 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.2584591395 + "score":0.1096684518 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.4586627531 + "score":0.4236658223 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"om", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.1783139223 + "score":0.0470010342 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.4481556757 + "score":0.3053087334 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.3002017818 + "score":0.0354609608 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.3739762238 + "score":0.3000471846 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.2649575888 + "score":0.1342178934 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.5072138807 + "score":0.4186845018 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.186903033 + "score":0.0959778877 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.411527522 + "score":0.4062370429 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2358876365 + "score":0.3790281875 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.4961149155 + "score":0.5948460259 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.2674122275 + "score":0.4122107278 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.4442281313 + "score":0.5709045042 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.9 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.3443124421 + "score":0.1956391774 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.5824988714 + "score":0.4696282098 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.3763691574 + "score":0.3089097764 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ms", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.6619682382 + "score":0.5592753275 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2596129619 + "score":0.2493437671 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.485235691 + "score":0.4876335319 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.2234699025 + "score":0.3816451478 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"my", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.4866737746 + "score":0.6189446172 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.1266863364 + "score":0.2159926241 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.3723937215 + "score":0.485645425 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.0507341481 + "score":0.4231210461 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"om", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.3372593565 + "score":0.611328256 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2495546416 + "score":0.2106935755 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.505250418 + "score":0.4916756186 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1370990235 + "score":0.2957139688 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.4188964845 + "score":0.5505026606 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.3898113091 + "score":0.0983614688 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.6349932626 + "score":0.3467631983 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.4218934881 + "score":0.2084502331 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.5699211354 + "score":0.5081363979 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.2238263799 + "score":0.183239364 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.5157447202 + "score":0.4023445581 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.3376407171 + "score":0.188899922 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.5674744623 + "score":0.3987821089 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.2 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.2989764302 + "score":0.1067913788 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.5575461672 + "score":0.3496287521 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.4347143661 + "score":0.1841725143 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.6526848356 + "score":0.3632256251 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.1 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.2156464838 + "score":0.0529920463 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.4961661832 + "score":0.282085967 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.3525318267 + "score":0.1362552545 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.5377697887 + "score":0.4625012714 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.3052635197 + "score":0.1467149035 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.5444415164 + "score":0.3956649623 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.319777613 + "score":0.1685063005 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.5070316671 + "score":0.4680460244 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.2373352462 + "score":0.1938115187 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.4812305289 + "score":0.4876215653 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.3592771753 + "score":0.301648159 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.6196466978 + "score":0.5098794037 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"su", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2189074797 + "score":0.1547225512 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.458549356 + "score":0.3915293941 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.2096038798 + "score":0.1695373764 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.48158495 + "score":0.4747320433 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3847076164 + "score":0.2691126673 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5961555843 + "score":0.4857803464 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.3031970309 + "score":0.3512121942 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.4938747459 + "score":0.6095777745 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.1973765077 + "score":0.1987953868 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.478302799 + "score":0.4232825095 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.390011731 + "score":0.2845246017 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.5192332126 + "score":0.5836686109 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.3027350341 + "score":0.1209729479 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5488245098 + "score":0.3863152501 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.3543135567 + "score":0.2257337081 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.5739783335 + "score":0.4945472603 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.2282243664 + "score":0.3081208582 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.4878680978 + "score":0.5470122853 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.2701355148 + "score":0.2720935434 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.4485608146 + "score":0.4603538628 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.2068814622 + "score":0.1562871243 }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"uz", + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.4820023997 + "score":0.4076252967 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.1797290418 + "score":0.1559524999 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"uz", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.5053214161 + "score":0.4140020888 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"th", + "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.2800966186 + "score":0.1699563701 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5447813345 + "score":0.4279668426 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.3743034645 + "score":0.3008412738 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.5977965321 + "score":0.4707696326 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.169474795 + "score":0.0460275677 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.4233016879 + "score":0.2471496791 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.1115736327 + "score":0.0301094125 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"wuu", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.1741292068 + "score":0.0934926984 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.1722143774 + "score":0.1772339365 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.451617464 + "score":0.4203181275 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.1362044502 + "score":0.3130066985 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.2472412788 + "score":0.5687455638 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.211203078 + "score":0.2094411351 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.4926704854 + "score":0.4706103434 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.2808125016 + "score":0.3725710921 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.3349070044 + "score":0.5552868727 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"am", + "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"am", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0334143542 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"am", - "task":"mmlu", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1507136538 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0016606076 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.0502679049 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ur", + "task":"classification", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"am", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0821675771 + "score":0.1864708336 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"am", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.3261780265 + "score":0.4670816214 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"am", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.0581954137 + "score":0.2648238029 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"am", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.2133137227 + "score":0.4478960511 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"apc", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"apc", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2038935703 + "score":0.1939396294 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"apc", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.4744865332 + "score":0.4361718347 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"apc", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.198427289 + "score":0.1189904742 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"apc", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.4466553325 + "score":0.4347992199 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", + "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2230716751 + "score":0.2392083536 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4868000305 + "score":0.5109371286 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.3431634646 + "score":0.3593480951 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.5539675011 + "score":0.5929525126 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.147678651 + "score":0.0586128965 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.3870664018 + "score":0.2347632724 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.1925682475 + "score":0.0021532802 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.424235974 + "score":0.1133302543 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"az", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":0.8 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"az", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.1020059939 + "score":0.160147676 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"az", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.3685311802 + "score":0.391740055 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"az", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1584050367 + "score":0.0779637528 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"az", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.4078207292 + "score":0.1486256305 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bho", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bho", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.1839199068 + "score":0.1080830211 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bho", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.4589371965 + "score":0.337342999 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bho", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.1754477624 + "score":0.0541477061 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bho", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.3729187467 + "score":0.3900223164 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", + "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.1 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", + "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.2104863522 + "score":0.0799412014 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.4534437048 + "score":0.2678562615 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.2824626 + "score":0.0384415516 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.4822940799 + "score":0.2172940187 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.8 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.282506513 + "score":0.1368607253 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.5438865496 + "score":0.4397284879 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.4220387975 + "score":0.1909241711 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.6440212985 + "score":0.2765267822 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.8 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.4926163025 + "score":0.1574414981 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.6598180449 + "score":0.4616304665 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.5627424753 + "score":0.2468189144 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.7654936904 + "score":0.3136635386 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", + "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.2 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.6 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.2400384539 + "score":0.1806603372 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.4846098061 + "score":0.4477026286 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.331169359 + "score":0.1983500358 }, { "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.541145091 + "score":0.4823277126 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"aeb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2046887048 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.3905043974 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.2440190587 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.4467530618 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"af", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"af", "task":"translation_from", "metric":"bleu", - "score":0.1934774812 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"af", "task":"translation_from", "metric":"chrf", - "score":0.4555822394 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"af", "task":"translation_to", "metric":"bleu", - "score":0.1515704996 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"af", "task":"translation_to", "metric":"chrf", - "score":0.4288811212 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ak", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.3049498802 + "score":0.1088055906 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.531726813 + "score":0.2952376966 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.2572361601 + "score":0.04860361 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.5465796366 + "score":0.2749922921 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.2 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.080495827 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.287512266 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0649609212 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.203944936 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.2245970544 + "score":0.2086617902 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.4773636644 + "score":0.4774317011 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.456500631 + "score":0.2730334942 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.6519350009 + "score":0.5458981435 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.1811700298 + "score":0.2530052174 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4450724584 + "score":0.5158812138 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.1152635411 + "score":0.3439536667 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.3751269086 + "score":0.5691908832 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ary", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.1042620188 + "score":0.1377297001 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.353512414 + "score":0.4304104417 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.1697643488 + "score":0.1906837255 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.4858315893 + "score":0.3931621016 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"arz", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.3100386494 + "score":0.1573943285 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.5747433617 + "score":0.4039837102 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.3858833658 + "score":0.2385684611 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.5991711103 + "score":0.4690487202 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", + "model":"openai\/gpt-4o-mini", + "bcp_47":"as", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", + "model":"openai\/gpt-4o-mini", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.1907075731 + "score":0.1786795263 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", + "model":"openai\/gpt-4o-mini", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.4662972265 + "score":0.4382834543 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", + "model":"openai\/gpt-4o-mini", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.3386484563 + "score":0.142030089 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", + "model":"openai\/gpt-4o-mini", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.6376664219 + "score":0.3706217658 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", + "model":"openai\/gpt-4o-mini", + "bcp_47":"awa", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", + "model":"openai\/gpt-4o-mini", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.2389788634 + "score":0.2061194828 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", + "model":"openai\/gpt-4o-mini", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.4950691973 + "score":0.38382712 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", + "model":"openai\/gpt-4o-mini", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.3197810714 + "score":0.2351754729 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", + "model":"openai\/gpt-4o-mini", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.5649240218 + "score":0.4412955741 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", + "model":"openai\/gpt-4o-mini", + "bcp_47":"az", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", + "model":"openai\/gpt-4o-mini", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.2240038475 + "score":0.1025818924 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", + "model":"openai\/gpt-4o-mini", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.4860646744 + "score":0.355623252 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", + "model":"openai\/gpt-4o-mini", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.2284065848 + "score":0.1290294373 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", + "model":"openai\/gpt-4o-mini", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.3753787999 + "score":0.3807908275 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", + "model":"openai\/gpt-4o-mini", + "bcp_47":"be", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", + "model":"openai\/gpt-4o-mini", + "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.1867349669 + "score":0.116157646 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", + "model":"openai\/gpt-4o-mini", + "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.4122967846 + "score":0.4411553165 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", + "model":"openai\/gpt-4o-mini", + "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.20591358 + "score":0.2284052455 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", + "model":"openai\/gpt-4o-mini", + "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.5231507594 + "score":0.4432025312 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.1659549387 + "score":0.1573424376 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.4341818109 + "score":0.3813908093 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.1728970527 + "score":0.1860567167 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.4006604704 + "score":0.3798747224 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bm", "task":"classification", "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bm", "task":"translation_from", "metric":"bleu", - "score":0.1418786679 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bm", "task":"translation_from", "metric":"chrf", - "score":0.4096096806 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bm", "task":"translation_to", "metric":"bleu", - "score":0.2767863837 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bm", "task":"translation_to", "metric":"chrf", - "score":0.343465352 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2649114053 + "score":0.2047894665 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5258722646 + "score":0.4476643899 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.1638513843 + "score":0.3413387194 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.3671674679 + "score":0.5056140066 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ca", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ca", "task":"translation_from", "metric":"bleu", - "score":0.1755855974 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ca", "task":"translation_from", "metric":"chrf", - "score":0.464470709 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ca", "task":"translation_to", "metric":"bleu", - "score":0.2053629902 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ca", "task":"translation_to", "metric":"chrf", - "score":0.4466569291 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ms", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":1.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ms", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.2391713081 + "score":0.3321604587 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ms", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.5284921106 + "score":0.524735789 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ms", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.3851770392 + "score":0.399945485 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ms", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.6778949951 + "score":0.6275070378 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"my", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ckb", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":1.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"my", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.1921402736 + "score":0.0862560502 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"my", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.4286234239 + "score":0.2788047314 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"my", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.226941594 + "score":0.0359802782 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"my", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.4545167964 + "score":0.2225612749 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"om", + "model":"openai\/gpt-4o-mini", + "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"om", + "model":"openai\/gpt-4o-mini", + "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.7 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"om", + "model":"openai\/gpt-4o-mini", + "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"om", + "model":"openai\/gpt-4o-mini", + "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.0470010342 + "score":0.2777777551 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"om", + "model":"openai\/gpt-4o-mini", + "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.3053087334 + "score":0.5317009045 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"om", + "model":"openai\/gpt-4o-mini", + "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.0354609608 + "score":0.2755276023 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"om", + "model":"openai\/gpt-4o-mini", + "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.3000471846 + "score":0.4907555325 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", "score":0.7 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1342178934 + "score":0.2840890109 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.4186845018 + "score":0.5146969249 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.0959778877 + "score":0.3999539422 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.4062370429 + "score":0.6267391818 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.3790281875 + "score":0.2595428958 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.5948460259 + "score":0.4813680319 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.4122107278 + "score":0.3306804036 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", + "model":"openai\/gpt-4o-mini", + "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.5709045042 + "score":0.4976939797 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", + "model":"openai\/gpt-4o-mini", + "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", + "model":"openai\/gpt-4o-mini", + "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":1.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", + "model":"openai\/gpt-4o-mini", + "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", + "model":"openai\/gpt-4o-mini", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.1956391774 + "score":0.5232930808 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", + "model":"openai\/gpt-4o-mini", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.4696282098 + "score":0.6688775695 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", + "model":"openai\/gpt-4o-mini", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.3089097764 + "score":0.6469796865 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", + "model":"openai\/gpt-4o-mini", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.5592753275 + "score":0.8203785308 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2493437671 + "score":0.2793939864 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.4876335319 + "score":0.5176409834 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3816451478 + "score":0.4118937163 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6189446172 + "score":0.6353341411 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.2106935755 + "score":0.2052699799 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.4916756186 + "score":0.4764669046 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.2957139688 + "score":0.2131911377 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.5505026606 + "score":0.4147480093 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.183239364 + "score":0.3062563146 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.4023445581 + "score":0.4925975136 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.188899922 + "score":0.32039199 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.3987821089 + "score":0.5717901387 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.1987953868 + "score":0.2706688563 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.4232825095 + "score":0.5148499232 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.2845246017 + "score":0.4808374237 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.5836686109 + "score":0.6855290209 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.1209729479 + "score":0.0270875349 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.3863152501 + "score":0.2100353402 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.2257337081 + "score":0.052858761 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.4945472603 + "score":0.1950018354 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", + "model":"openai\/gpt-4o-mini", + "bcp_47":"gu", "task":"classification", "metric":"accuracy", - "score":0.8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", + "model":"openai\/gpt-4o-mini", + "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.3081208582 + "score":0.2245042279 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", + "model":"openai\/gpt-4o-mini", + "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5470122853 + "score":0.4426786034 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", + "model":"openai\/gpt-4o-mini", + "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.2720935434 + "score":0.1920269509 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", + "model":"openai\/gpt-4o-mini", + "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4603538628 + "score":0.4643025206 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1699563701 + "score":0.1154893286 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.4279668426 + "score":0.3792147754 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.3008412738 + "score":0.2191612695 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.4707696326 + "score":0.4879764503 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.1772339365 + "score":0.3473235908 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.4203181275 + "score":0.5515454754 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3130066985 + "score":0.3991894826 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.5687455638 + "score":0.6121310121 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.1864708336 + "score":0.247888062 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.4670816214 + "score":0.4353918541 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.2648238029 + "score":0.1626119723 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.4478960511 + "score":0.4423709529 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"uz", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ht", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"uz", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ht", "task":"translation_from", "metric":"bleu", - "score":0.1939396294 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"uz", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ht", "task":"translation_from", "metric":"chrf", - "score":0.4361718347 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"uz", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ht", "task":"translation_to", "metric":"bleu", - "score":0.1189904742 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"uz", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ht", "task":"translation_to", "metric":"chrf", - "score":0.4347992199 + "score":0.0 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hu", + "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.2392083536 + "score":0.2640028594 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5109371286 + "score":0.524505973 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.3593480951 + "score":0.3929863672 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.5929525126 + "score":0.5880857849 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"wuu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", "task":"classification", "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", "score":0.8 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"wuu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.160147676 + "score":0.2522725561 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"wuu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.391740055 + "score":0.5212732474 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"wuu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.0779637528 + "score":0.2850030055 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"wuu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.1486256305 + "score":0.5970450995 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ig", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.1368607253 + "score":0.1326727529 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.4397284879 + "score":0.3646478687 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.1909241711 + "score":0.1882093096 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ig", "task":"translation_to", - "metric":"chrf", - "score":0.2765267822 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 + "metric":"chrf", + "score":0.4009607044 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ilo", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.1574414981 + "score":0.1988516559 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.4616304665 + "score":0.405478436 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.2468189144 + "score":0.0961457593 }, { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.3136635386 + "score":0.4060794313 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"am", + "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"am", + "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"am", + "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"am", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.080495827 + "score":0.2746808629 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"am", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.287512266 + "score":0.5180176469 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"am", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.0649609212 + "score":0.3112912727 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"am", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.203944936 + "score":0.5712680542 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"apc", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"apc", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2086617902 + "score":0.2363319461 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"apc", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.4774317011 + "score":0.4826308954 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"apc", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.2730334942 + "score":0.2593036542 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"apc", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.5458981435 + "score":0.4231415642 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.2530052174 + "score":0.2480055389 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5158812138 + "score":0.4685108662 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.3439536667 + "score":0.2241033812 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5691908832 + "score":0.5113817494 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", + "bcp_47":"ki", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", + "bcp_47":"ki", "task":"translation_from", "metric":"bleu", - "score":0.1573943285 + "score":0.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", + "bcp_47":"ki", "task":"translation_from", "metric":"chrf", - "score":0.4039837102 + "score":0.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", + "bcp_47":"ki", "task":"translation_to", "metric":"bleu", - "score":0.2385684611 + "score":0.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", + "bcp_47":"ki", "task":"translation_to", "metric":"chrf", - "score":0.4690487202 + "score":0.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"az", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"az", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.1025818924 + "score":0.147911394 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"az", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.355623252 + "score":0.3985376686 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"az", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.1290294373 + "score":0.290182238 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"az", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.3807908275 + "score":0.5572310551 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bho", + "bcp_47":"km", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bho", + "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.1573424376 + "score":0.2772807862 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bho", + "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.3813908093 + "score":0.504897576 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bho", + "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.1860567167 + "score":0.1404234583 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bho", + "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.3798747224 + "score":0.3189837953 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", + "bcp_47":"kn", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", + "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.2047894665 + "score":0.1849035655 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", + "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.4476643899 + "score":0.430576325 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", + "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.3413387194 + "score":0.2444722013 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", + "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.5056140066 + "score":0.4742295195 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"de", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", + "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"de", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2840890109 + "score":0.2013601575 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"de", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.5146969249 + "score":0.4475607863 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"de", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.3999539422 + "score":0.1980395856 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"de", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.6267391818 + "score":0.2888993735 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"en", + "bcp_47":"lua", "task":"classification", "metric":"accuracy", "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", + "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.5232930808 + "score":0.042643493 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"en", + "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.6688775695 + "score":0.2339244707 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"en", + "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.6469796865 + "score":0.0143208425 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"en", + "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.8203785308 + "score":0.2382431413 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"es", + "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"es", + "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.2793939864 + "score":0.2373436047 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"es", + "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.5176409834 + "score":0.4564427975 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"es", + "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.4118937163 + "score":0.2754056305 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"es", + "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.6353341411 + "score":0.5123611693 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", + "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":1.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", + "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.2052699799 + "score":0.2027297928 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", + "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.4764669046 + "score":0.4495211176 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", + "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.2131911377 + "score":0.1639594712 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", + "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4147480093 + "score":0.4482904829 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", + "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", + "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", + "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.3062563146 + "score":0.2035781185 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", + "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.4925975136 + "score":0.4598803974 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", + "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.32039199 + "score":0.1964079195 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", + "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5717901387 + "score":0.5179064416 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", + "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", + "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2706688563 + "score":0.2246064108 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", + "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5148499232 + "score":0.4311975246 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", + "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.4808374237 + "score":0.2434125045 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", + "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.6855290209 + "score":0.4971145063 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2245042279 + "score":0.1756463826 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.4426786034 + "score":0.3823527701 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.1920269509 + "score":0.2340922946 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.4643025206 + "score":0.4581322597 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", + "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", + "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", "score":0.5 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", + "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.1154893286 + "score":0.2993296846 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", + "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.3792147754 + "score":0.5743132494 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", + "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.2191612695 + "score":0.3504238332 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", + "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.4879764503 + "score":0.6154153931 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", + "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":1.0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", + "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.3473235908 + "score":0.1741885177 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", + "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.5515454754 + "score":0.449774491 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", + "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.3991894826 + "score":0.2106778 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", + "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.6121310121 + "score":0.4610458467 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"id", + "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"id", + "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"id", + "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.2522725561 + "score":0.2483418024 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"id", + "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5212732474 + "score":0.4432537254 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"id", + "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2850030055 + "score":0.2305902219 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"id", + "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.5970450995 + "score":0.5017217229 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"it", + "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"it", + "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"it", + "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"it", + "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2746808629 + "score":0.2523126947 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"it", + "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5180176469 + "score":0.4772912105 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"it", + "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.3112912727 + "score":0.3639443469 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"it", + "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.5712680542 + "score":0.6252850371 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", + "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", + "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", + "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2363319461 + "score":0.0835095719 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", + "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.4826308954 + "score":0.2797853634 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", + "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.2593036542 + "score":0.0779315192 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", + "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.4231415642 + "score":0.4121236337 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", + "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.2480055389 + "score":0.0511068522 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", + "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.4685108662 + "score":0.2702934215 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", + "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.2241033812 + "score":0.0724907554 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", + "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.5113817494 + "score":0.345324531 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", + "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", + "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.1849035655 + "score":0.1164462601 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", + "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.430576325 + "score":0.3729006132 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", + "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.2444722013 + "score":0.1379248705 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", + "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.4742295195 + "score":0.4079943111 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2013601575 + "score":0.3640514137 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.4475607863 + "score":0.5847142015 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.1980395856 + "score":0.3988016179 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.2888993735 + "score":0.5745254523 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", + "bcp_47":"pl", "task":"classification", "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", + "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2246064108 + "score":0.2319955399 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", + "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.4311975246 + "score":0.4971130964 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", + "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.2434125045 + "score":0.293769398 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", + "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.4971145063 + "score":0.535772663 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.1756463826 + "score":0.3014354397 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.3823527701 + "score":0.5315937202 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.2340922946 + "score":0.4535066637 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.4581322597 + "score":0.6773057972 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ms", + "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ms", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.7 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ms", + "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.2993296846 + "score":0.2532461677 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ms", + "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5743132494 + "score":0.5201960699 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ms", + "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.3504238332 + "score":0.5052082065 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ms", + "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.6154153931 + "score":0.6686611337 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"my", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"my", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.1741885177 + "score":0.2270580453 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"my", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.449774491 + "score":0.5034759488 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"my", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.2106778 + "score":0.3258505825 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"my", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.4610458467 + "score":0.5592402358 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"om", + "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"om", + "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", "score":0.3 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"om", + "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", "score":0.6 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"om", + "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.0511068522 + "score":0.0829790682 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"om", + "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.2702934215 + "score":0.337986391 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"om", + "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.0724907554 + "score":0.2129352292 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"om", + "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.345324531 + "score":0.5084793087 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"or", + "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"or", + "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.1164462601 + "score":0.15024418 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"or", + "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.3729006132 + "score":0.3597265355 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"or", + "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.1379248705 + "score":0.2369214411 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"or", + "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.4079943111 + "score":0.4711257499 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", + "bcp_47":"si", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.3640514137 + "score":0.0980707024 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", + "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.5847142015 + "score":0.3109100287 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", + "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.3988016179 + "score":0.1934430032 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", + "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.5745254523 + "score":0.3560526886 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", + "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", + "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.3 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", + "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", + "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.2319955399 + "score":0.0582100604 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", + "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.4971130964 + "score":0.3075785834 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", + "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.293769398 + "score":0.1011833785 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", + "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.535772663 + "score":0.4367282377 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", + "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", + "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", + "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.3014354397 + "score":0.1531795055 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", + "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.5315937202 + "score":0.3616443224 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", + "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.4535066637 + "score":0.2049307012 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", + "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.6773057972 + "score":0.4719724156 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", + "bcp_47":"sr", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mgsm", + "bcp_47":"sr", + "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2199024767 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.4907562634 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.3830980295 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.5736359642 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"su", + "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", + "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2270580453 + "score":0.2379030124 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", + "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.5034759488 + "score":0.4403417868 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", + "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.3258505825 + "score":0.2238060743 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", + "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.5592402358 + "score":0.5243303769 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", + "bcp_47":"sv", "task":"classification", "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", "score":0.9 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.15024418 + "score":0.2852268785 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", + "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.3597265355 + "score":0.5304479976 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", + "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.2369214411 + "score":0.3829618265 }, { "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", + "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.4711257499 + "score":0.6326982198 }, { "model":"openai\/gpt-4o-mini", @@ -47711,6 +110893,41 @@ "metric":"chrf", "score":0.5444122929 }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.1128962774 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.3493465213 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.1841235337 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.417497165 + }, { "model":"openai\/gpt-4o-mini", "bcp_47":"th", @@ -47753,6 +110970,41 @@ "metric":"chrf", "score":0.5010514821 }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0408372058 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.2042987422 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0231278614 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0849541719 + }, { "model":"openai\/gpt-4o-mini", "bcp_47":"tr", @@ -47795,6 +111047,83 @@ "metric":"chrf", "score":0.5999237379 }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2245951815 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.4480996711 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3852002404 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5711778517 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0415789397 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1350551103 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0010517421 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.0968599255 + }, { "model":"openai\/gpt-4o-mini", "bcp_47":"ur", @@ -47907,6 +111236,55 @@ "metric":"chrf", "score":0.514972808 }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.08218909 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2632475474 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0383287658 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.1924695915 + }, { "model":"openai\/gpt-4o-mini", "bcp_47":"wuu", @@ -47942,6 +111320,104 @@ "metric":"chrf", "score":0.1706758411 }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.158569201 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.3926886149 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0591321886 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.3427023375 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.079919346 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.279919938 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0720231313 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.2187010976 + }, { "model":"openai\/gpt-4o-mini", "bcp_47":"yue", @@ -48025,5 +111501,54 @@ "task":"translation_to", "metric":"chrf", "score":0.3274827604 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1866603918 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.4108538087 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.164847197 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.4524644478 } ] \ No newline at end of file