Spaces:
Build error
Build error
completed results: max_new_tokens = 2048 and new addition of Phi-3.5-mini (3.8B)
Browse files- notebooks/00b_Data Analysis_Few_Shots.ipynb +2 -2
- notebooks/00c_Data Analysis_Fine_Tuned.ipynb +0 -0
- notebooks/00e_Data Analysis_Fine_Tuned_RPP_MNT_2048.ipynb +0 -0
- results/mac-results_few_shots.csv +2 -2
- results/mac-results_few_shots_metrics.csv +2 -2
- results/mac-results_fine_tuned.csv +2 -2
- results/mac-results_fine_tuned_metrics.csv +2 -2
- results/mac-results_rpp_with_mnt_2048_metrics.csv +18 -10
notebooks/00b_Data Analysis_Few_Shots.ipynb
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a33a8dc2231bdcafd2a175e0c6c6de1039d8779f0a384e645c6f9018b6930ea
|
3 |
+
size 3538126
|
notebooks/00c_Data Analysis_Fine_Tuned.ipynb
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
notebooks/00e_Data Analysis_Fine_Tuned_RPP_MNT_2048.ipynb
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
results/mac-results_few_shots.csv
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5eee20d96e97977b074da72907f0e00ab38105f55665b502a5686cbc8bf7da42
|
3 |
+
size 6372725
|
results/mac-results_few_shots_metrics.csv
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36826dcad77fd126f2aec3afc445ad64ad9ccf086b0dd3c31685646d4ee57c42
|
3 |
+
size 10540
|
results/mac-results_fine_tuned.csv
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8875b9912b2866e0614391accb2bf41dfc9445d93984ac64c6da9ce18660fb35
|
3 |
+
size 10710407
|
results/mac-results_fine_tuned_metrics.csv
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00d4b8d25ebd4696bc7589fce93e25b58a46686715ead9a205cc8c9bdfef31c7
|
3 |
+
size 11002
|
results/mac-results_rpp_with_mnt_2048_metrics.csv
CHANGED
@@ -1,8 +1,10 @@
|
|
1 |
model,rpp,meteor,spbleu,bleu_1,rouge_l,ews_score,repetition_score,total_repetitions,rap,num_incomplete_translations,num_max_output_tokens,eval_time
|
2 |
-
Qwen/Qwen2-72B-Instruct,1.00,0.47892081926016034,18.953782447211417,0.18953782447211412,0.4521569211424892,0.0,0.09885260370697264,0.09885260370697264,0.4768835566987496,0,0,15.
|
3 |
-
Qwen/Qwen2-72B-Instruct,1.02,0.47968366756320546,19.0137490702917,0.190137490702917,0.45197054564395384,0.0,0.08120035304501325,0.08120035304501325,0.47800479714301924,0,0,15.
|
4 |
-
Qwen/Qwen2-72B-Instruct,1.04,0.476362681282195,18.52063321160408,0.1852063321160408,0.44894205112535357,0.0,0.10503089143865843,0.10503089143865843,0.4742108804113156,0,0,15.
|
5 |
-
Qwen/Qwen2-72B-Instruct,1.06,0.46796363839506494,17.982473951038504,0.17982473951038513,0.441041000758417,0.0,0.07325684024713151,0.07325684024713151,0.466484924380041,0,0,15.
|
|
|
|
|
6 |
Qwen/Qwen2-7B-Instruct,1.00,0.442240791493943,14.38814929350883,0.1438814929350883,0.4161653982436496,0.0,12.81288614298323,12.81288614298323,0.3256127432585341,6,2,2.2162400706090026
|
7 |
Qwen/Qwen2-7B-Instruct,1.02,0.4400998640836595,15.16172261831792,0.1516172261831792,0.41646468384393903,0.0,7.1562224183583405,7.1562224183583405,0.356523119707599,6,1,1.586054721977052
|
8 |
Qwen/Qwen2-7B-Instruct,1.04,0.4390136558190875,14.958631815014014,0.14958631815014015,0.41437075031278525,0.0,0.1853486319505737,0.1853486319505737,0.43553983411076963,1,0,1.0123565754633717
|
@@ -15,12 +17,18 @@ internlm/internlm2_5-7b-chat,1.04,0.4154585167056314,13.534659133050223,0.135346
|
|
15 |
internlm/internlm2_5-7b-chat,1.06,0.40395886478553783,12.346740971499404,0.12346740971499397,0.38739729431897413,0.0,6.533980582524272,6.533980582524272,0.3315547851383537,1,1,2.153574580759047
|
16 |
internlm/internlm2_5-7b-chat,1.08,0.3873176839854818,11.075674965706343,0.11075674965706349,0.3727703497077143,0.0,9.820829655781113,9.820829655781113,0.2985977687581126,1,1,2.148278905560459
|
17 |
internlm/internlm2_5-7b-chat,1.10,0.3769306874386757,10.305163787094209,0.10305163787094214,0.3636303538397795,0.0,6.525154457193292,6.525154457193292,0.30942993176825007,1,1,2.172109443954104
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
24 |
shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.00,0.43363250166217604,15.209540658023398,0.1520954065802339,0.4087331128794971,0.0,5.798764342453663,5.798764342453663,0.36177551894565085,0,1,1.7625772285966461
|
25 |
shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.02,0.4329054166518245,15.19102241646024,0.1519102241646024,0.4070425935096388,0.0,5.77846425419241,5.77846425419241,0.3613372514106729,0,1,1.7493380406001766
|
26 |
shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.04,0.43204787009562073,15.051351661582961,0.15051351661582968,0.40610700867871297,0.0,0.11827007943512798,0.11827007943512798,0.42985292605837966,0,0,1.0467784642541924
|
|
|
1 |
model,rpp,meteor,spbleu,bleu_1,rouge_l,ews_score,repetition_score,total_repetitions,rap,num_incomplete_translations,num_max_output_tokens,eval_time
|
2 |
+
Qwen/Qwen2-72B-Instruct,1.00,0.47892081926016034,18.953782447211417,0.18953782447211412,0.4521569211424892,0.0,0.09885260370697264,0.09885260370697264,0.4768835566987496,0,0,15.977934686672551
|
3 |
+
Qwen/Qwen2-72B-Instruct,1.02,0.47968366756320546,19.0137490702917,0.190137490702917,0.45197054564395384,0.0,0.08120035304501325,0.08120035304501325,0.47800479714301924,0,0,15.785525154457194
|
4 |
+
Qwen/Qwen2-72B-Instruct,1.04,0.476362681282195,18.52063321160408,0.1852063321160408,0.44894205112535357,0.0,0.10503089143865843,0.10503089143865843,0.4742108804113156,0,0,15.759046778464255
|
5 |
+
Qwen/Qwen2-72B-Instruct,1.06,0.46796363839506494,17.982473951038504,0.17982473951038513,0.441041000758417,0.0,0.07325684024713151,0.07325684024713151,0.466484924380041,0,0,15.851721094439542
|
6 |
+
Qwen/Qwen2-72B-Instruct,1.08,0.45975781977116453,17.067954025424825,0.17067954025424834,0.43174454568405374,0.0,0.04766107678729038,0.04766107678729038,0.45881038677745906,0,0,15.924095322153574
|
7 |
+
Qwen/Qwen2-72B-Instruct,1.10,0.4515778511124262,16.22452191616505,0.16224521916165044,0.4243494436012768,0.0,0.05736981465136805,0.05736981465136805,0.4504587226091121,0,0,15.984995586937334
|
8 |
Qwen/Qwen2-7B-Instruct,1.00,0.442240791493943,14.38814929350883,0.1438814929350883,0.4161653982436496,0.0,12.81288614298323,12.81288614298323,0.3256127432585341,6,2,2.2162400706090026
|
9 |
Qwen/Qwen2-7B-Instruct,1.02,0.4400998640836595,15.16172261831792,0.1516172261831792,0.41646468384393903,0.0,7.1562224183583405,7.1562224183583405,0.356523119707599,6,1,1.586054721977052
|
10 |
Qwen/Qwen2-7B-Instruct,1.04,0.4390136558190875,14.958631815014014,0.14958631815014015,0.41437075031278525,0.0,0.1853486319505737,0.1853486319505737,0.43553983411076963,1,0,1.0123565754633717
|
|
|
17 |
internlm/internlm2_5-7b-chat,1.06,0.40395886478553783,12.346740971499404,0.12346740971499397,0.38739729431897413,0.0,6.533980582524272,6.533980582524272,0.3315547851383537,1,1,2.153574580759047
|
18 |
internlm/internlm2_5-7b-chat,1.08,0.3873176839854818,11.075674965706343,0.11075674965706349,0.3727703497077143,0.0,9.820829655781113,9.820829655781113,0.2985977687581126,1,1,2.148278905560459
|
19 |
internlm/internlm2_5-7b-chat,1.10,0.3769306874386757,10.305163787094209,0.10305163787094214,0.3636303538397795,0.0,6.525154457193292,6.525154457193292,0.30942993176825007,1,1,2.172109443954104
|
20 |
+
microsoft/Phi-3.5-mini-instruct,1.00,0.37968315453481294,8.71296896471494,0.08712968964714936,0.35850654380084257,0.0,28.42630185348632,28.42630185348632,0.23960387748577275,0,6,5.484554280670785
|
21 |
+
microsoft/Phi-3.5-mini-instruct,1.02,0.3780585837553919,10.291240080163629,0.10291240080163629,0.3548291746069422,0.0,10.696381288614297,10.696381288614297,0.2873016094123469,0,2,2.6337157987643423
|
22 |
+
microsoft/Phi-3.5-mini-instruct,1.04,0.35471613338457425,8.966881655527896,0.08966881655527896,0.33033473881366876,0.0,3.7484554280670785,3.7484554280670785,0.3116318162898625,0,1,1.9285083848190645
|
23 |
+
microsoft/Phi-3.5-mini-instruct,1.06,0.3298733737040869,7.076233088011138,0.07076233088011138,0.3021292838048098,0.0,0.10767872903795234,0.10767872903795234,0.3283460949961551,0,0,1.3159752868490733
|
24 |
+
microsoft/Phi-3.5-mini-instruct,1.08,0.3054541022592767,5.105510599247868,0.05105510599247869,0.2734682521006445,0.0,3.29567519858782,3.29567519858782,0.2718263558255611,0,1,2.054721977052074
|
25 |
+
microsoft/Phi-3.5-mini-instruct,1.10,0.2903831801547132,4.091958857999118,0.04091958857999117,0.25172729782510583,0.0,0.07766990291262135,0.07766990291262135,0.28941072284774055,0,0,1.9638128861429833
|
26 |
+
shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.00,0.46111105085070175,17.87914973742753,0.17879149737427524,0.4340569906195885,0.0,0.088261253309797,0.088261253309797,0.4593579935085897,0,0,16.17828773168579
|
27 |
+
shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.02,0.45715172190795766,17.436884594979905,0.17436884594979907,0.4309998159694175,0.0,0.09267431597528684,0.09267431597528684,0.45532756172969063,0,0,15.968225948808474
|
28 |
+
shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.04,0.45604679603642545,17.440173470996626,0.17440173470996626,0.43028250668592427,0.0,0.13062665489849956,0.13062665489849956,0.4534907811633413,0,0,16.050308914386584
|
29 |
+
shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.06,0.45204163612198556,16.89523258317781,0.16895232583177808,0.42594768159318286,0.0,0.12533097969991175,0.12533097969991175,0.44960959510411197,0,0,15.972639011473962
|
30 |
+
shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.08,0.4442106511292453,16.16623784482793,0.16166237844827927,0.4196173445876259,0.0,0.18711385701676964,0.18711385701676964,0.4406628043373358,0,0,15.998234774933804
|
31 |
+
shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.10,0.43798379261381615,15.601722576240661,0.1560172257624066,0.4135114396257313,0.0,0.08649602824360106,0.08649602824360106,0.4363516968290564,0,0,16.018534863195057
|
32 |
shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.00,0.43363250166217604,15.209540658023398,0.1520954065802339,0.4087331128794971,0.0,5.798764342453663,5.798764342453663,0.36177551894565085,0,1,1.7625772285966461
|
33 |
shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.02,0.4329054166518245,15.19102241646024,0.1519102241646024,0.4070425935096388,0.0,5.77846425419241,5.77846425419241,0.3613372514106729,0,1,1.7493380406001766
|
34 |
shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.04,0.43204787009562073,15.051351661582961,0.15051351661582968,0.40610700867871297,0.0,0.11827007943512798,0.11827007943512798,0.42985292605837966,0,0,1.0467784642541924
|