dh-mc commited on
Commit
a35e6bd
1 Parent(s): 8f3ae45

completed results: max_new_tokens = 2048 and new addition of Phi-3.5-mini (3.8B)

Browse files
notebooks/00b_Data Analysis_Few_Shots.ipynb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d7af735cc4e9c4395e8bba07f2d212edc159f0f8f8cf83281f25f1ea8c2d717
3
- size 3332561
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a33a8dc2231bdcafd2a175e0c6c6de1039d8779f0a384e645c6f9018b6930ea
3
+ size 3538126
notebooks/00c_Data Analysis_Fine_Tuned.ipynb CHANGED
The diff for this file is too large to render. See raw diff
 
notebooks/00e_Data Analysis_Fine_Tuned_RPP_MNT_2048.ipynb CHANGED
The diff for this file is too large to render. See raw diff
 
results/mac-results_few_shots.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f723eef48aef85396c145f7d720349203ec2071fc6483f10b787b39a0f46c7a
3
- size 5592490
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eee20d96e97977b074da72907f0e00ab38105f55665b502a5686cbc8bf7da42
3
+ size 6372725
results/mac-results_few_shots_metrics.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:945e48d5773ce3a870e793e410c79148bd34c1b427c7bcd8e9e5ec140e574fa7
3
- size 9379
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36826dcad77fd126f2aec3afc445ad64ad9ccf086b0dd3c31685646d4ee57c42
3
+ size 10540
results/mac-results_fine_tuned.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0564bf0b1589e346ae507a61b254da0f53cf4130fbf997f51cd44d77b505bba
3
- size 11490642
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8875b9912b2866e0614391accb2bf41dfc9445d93984ac64c6da9ce18660fb35
3
+ size 10710407
results/mac-results_fine_tuned_metrics.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13b905223cb46875da8cb216aa36068a02ee6a98411bda6fda445bd95c5b28a2
3
- size 7339
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00d4b8d25ebd4696bc7589fce93e25b58a46686715ead9a205cc8c9bdfef31c7
3
+ size 11002
results/mac-results_rpp_with_mnt_2048_metrics.csv CHANGED
@@ -1,8 +1,10 @@
1
  model,rpp,meteor,spbleu,bleu_1,rouge_l,ews_score,repetition_score,total_repetitions,rap,num_incomplete_translations,num_max_output_tokens,eval_time
2
- Qwen/Qwen2-72B-Instruct,1.00,0.47892081926016034,18.953782447211417,0.18953782447211412,0.4521569211424892,0.0,0.09885260370697264,0.09885260370697264,0.4768835566987496,0,0,15.931156222418359
3
- Qwen/Qwen2-72B-Instruct,1.02,0.47968366756320546,19.0137490702917,0.190137490702917,0.45197054564395384,0.0,0.08120035304501325,0.08120035304501325,0.47800479714301924,0,0,15.855251544571933
4
- Qwen/Qwen2-72B-Instruct,1.04,0.476362681282195,18.52063321160408,0.1852063321160408,0.44894205112535357,0.0,0.10503089143865843,0.10503089143865843,0.4742108804113156,0,0,15.78640776699029
5
- Qwen/Qwen2-72B-Instruct,1.06,0.46796363839506494,17.982473951038504,0.17982473951038513,0.441041000758417,0.0,0.07325684024713151,0.07325684024713151,0.466484924380041,0,0,15.872021182700795
 
 
6
  Qwen/Qwen2-7B-Instruct,1.00,0.442240791493943,14.38814929350883,0.1438814929350883,0.4161653982436496,0.0,12.81288614298323,12.81288614298323,0.3256127432585341,6,2,2.2162400706090026
7
  Qwen/Qwen2-7B-Instruct,1.02,0.4400998640836595,15.16172261831792,0.1516172261831792,0.41646468384393903,0.0,7.1562224183583405,7.1562224183583405,0.356523119707599,6,1,1.586054721977052
8
  Qwen/Qwen2-7B-Instruct,1.04,0.4390136558190875,14.958631815014014,0.14958631815014015,0.41437075031278525,0.0,0.1853486319505737,0.1853486319505737,0.43553983411076963,1,0,1.0123565754633717
@@ -15,12 +17,18 @@ internlm/internlm2_5-7b-chat,1.04,0.4154585167056314,13.534659133050223,0.135346
15
  internlm/internlm2_5-7b-chat,1.06,0.40395886478553783,12.346740971499404,0.12346740971499397,0.38739729431897413,0.0,6.533980582524272,6.533980582524272,0.3315547851383537,1,1,2.153574580759047
16
  internlm/internlm2_5-7b-chat,1.08,0.3873176839854818,11.075674965706343,0.11075674965706349,0.3727703497077143,0.0,9.820829655781113,9.820829655781113,0.2985977687581126,1,1,2.148278905560459
17
  internlm/internlm2_5-7b-chat,1.10,0.3769306874386757,10.305163787094209,0.10305163787094214,0.3636303538397795,0.0,6.525154457193292,6.525154457193292,0.30942993176825007,1,1,2.172109443954104
18
- shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.00,0.46111105085070175,17.87914973742753,0.17879149737427524,0.4340569906195885,0.0,0.088261253309797,0.088261253309797,0.4593579935085897,0,0,16.127978817299205
19
- shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.02,0.45715172190795766,17.436884594979905,0.17436884594979907,0.4309998159694175,0.0,0.09267431597528684,0.09267431597528684,0.45532756172969063,0,0,15.987643424536628
20
- shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.04,0.45604679603642545,17.440173470996626,0.17440173470996626,0.43028250668592427,0.0,0.13062665489849956,0.13062665489849956,0.4534907811633413,0,0,15.958517210944395
21
- shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.06,0.45204163612198556,16.89523258317781,0.16895232583177808,0.42594768159318286,0.0,0.12533097969991175,0.12533097969991175,0.44960959510411197,0,0,15.998234774933804
22
- shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.08,0.4442106511292453,16.16623784482793,0.16166237844827927,0.4196173445876259,0.0,0.18711385701676964,0.18711385701676964,0.4406628043373358,0,0,15.89143865842895
23
- shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.10,0.43798379261381615,15.601722576240661,0.1560172257624066,0.4135114396257313,0.0,0.08649602824360106,0.08649602824360106,0.4363516968290564,0,0,15.981465136804943
 
 
 
 
 
 
24
  shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.00,0.43363250166217604,15.209540658023398,0.1520954065802339,0.4087331128794971,0.0,5.798764342453663,5.798764342453663,0.36177551894565085,0,1,1.7625772285966461
25
  shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.02,0.4329054166518245,15.19102241646024,0.1519102241646024,0.4070425935096388,0.0,5.77846425419241,5.77846425419241,0.3613372514106729,0,1,1.7493380406001766
26
  shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.04,0.43204787009562073,15.051351661582961,0.15051351661582968,0.40610700867871297,0.0,0.11827007943512798,0.11827007943512798,0.42985292605837966,0,0,1.0467784642541924
 
1
  model,rpp,meteor,spbleu,bleu_1,rouge_l,ews_score,repetition_score,total_repetitions,rap,num_incomplete_translations,num_max_output_tokens,eval_time
2
+ Qwen/Qwen2-72B-Instruct,1.00,0.47892081926016034,18.953782447211417,0.18953782447211412,0.4521569211424892,0.0,0.09885260370697264,0.09885260370697264,0.4768835566987496,0,0,15.977934686672551
3
+ Qwen/Qwen2-72B-Instruct,1.02,0.47968366756320546,19.0137490702917,0.190137490702917,0.45197054564395384,0.0,0.08120035304501325,0.08120035304501325,0.47800479714301924,0,0,15.785525154457194
4
+ Qwen/Qwen2-72B-Instruct,1.04,0.476362681282195,18.52063321160408,0.1852063321160408,0.44894205112535357,0.0,0.10503089143865843,0.10503089143865843,0.4742108804113156,0,0,15.759046778464255
5
+ Qwen/Qwen2-72B-Instruct,1.06,0.46796363839506494,17.982473951038504,0.17982473951038513,0.441041000758417,0.0,0.07325684024713151,0.07325684024713151,0.466484924380041,0,0,15.851721094439542
6
+ Qwen/Qwen2-72B-Instruct,1.08,0.45975781977116453,17.067954025424825,0.17067954025424834,0.43174454568405374,0.0,0.04766107678729038,0.04766107678729038,0.45881038677745906,0,0,15.924095322153574
7
+ Qwen/Qwen2-72B-Instruct,1.10,0.4515778511124262,16.22452191616505,0.16224521916165044,0.4243494436012768,0.0,0.05736981465136805,0.05736981465136805,0.4504587226091121,0,0,15.984995586937334
8
  Qwen/Qwen2-7B-Instruct,1.00,0.442240791493943,14.38814929350883,0.1438814929350883,0.4161653982436496,0.0,12.81288614298323,12.81288614298323,0.3256127432585341,6,2,2.2162400706090026
9
  Qwen/Qwen2-7B-Instruct,1.02,0.4400998640836595,15.16172261831792,0.1516172261831792,0.41646468384393903,0.0,7.1562224183583405,7.1562224183583405,0.356523119707599,6,1,1.586054721977052
10
  Qwen/Qwen2-7B-Instruct,1.04,0.4390136558190875,14.958631815014014,0.14958631815014015,0.41437075031278525,0.0,0.1853486319505737,0.1853486319505737,0.43553983411076963,1,0,1.0123565754633717
 
17
  internlm/internlm2_5-7b-chat,1.06,0.40395886478553783,12.346740971499404,0.12346740971499397,0.38739729431897413,0.0,6.533980582524272,6.533980582524272,0.3315547851383537,1,1,2.153574580759047
18
  internlm/internlm2_5-7b-chat,1.08,0.3873176839854818,11.075674965706343,0.11075674965706349,0.3727703497077143,0.0,9.820829655781113,9.820829655781113,0.2985977687581126,1,1,2.148278905560459
19
  internlm/internlm2_5-7b-chat,1.10,0.3769306874386757,10.305163787094209,0.10305163787094214,0.3636303538397795,0.0,6.525154457193292,6.525154457193292,0.30942993176825007,1,1,2.172109443954104
20
+ microsoft/Phi-3.5-mini-instruct,1.00,0.37968315453481294,8.71296896471494,0.08712968964714936,0.35850654380084257,0.0,28.42630185348632,28.42630185348632,0.23960387748577275,0,6,5.484554280670785
21
+ microsoft/Phi-3.5-mini-instruct,1.02,0.3780585837553919,10.291240080163629,0.10291240080163629,0.3548291746069422,0.0,10.696381288614297,10.696381288614297,0.2873016094123469,0,2,2.6337157987643423
22
+ microsoft/Phi-3.5-mini-instruct,1.04,0.35471613338457425,8.966881655527896,0.08966881655527896,0.33033473881366876,0.0,3.7484554280670785,3.7484554280670785,0.3116318162898625,0,1,1.9285083848190645
23
+ microsoft/Phi-3.5-mini-instruct,1.06,0.3298733737040869,7.076233088011138,0.07076233088011138,0.3021292838048098,0.0,0.10767872903795234,0.10767872903795234,0.3283460949961551,0,0,1.3159752868490733
24
+ microsoft/Phi-3.5-mini-instruct,1.08,0.3054541022592767,5.105510599247868,0.05105510599247869,0.2734682521006445,0.0,3.29567519858782,3.29567519858782,0.2718263558255611,0,1,2.054721977052074
25
+ microsoft/Phi-3.5-mini-instruct,1.10,0.2903831801547132,4.091958857999118,0.04091958857999117,0.25172729782510583,0.0,0.07766990291262135,0.07766990291262135,0.28941072284774055,0,0,1.9638128861429833
26
+ shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.00,0.46111105085070175,17.87914973742753,0.17879149737427524,0.4340569906195885,0.0,0.088261253309797,0.088261253309797,0.4593579935085897,0,0,16.17828773168579
27
+ shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.02,0.45715172190795766,17.436884594979905,0.17436884594979907,0.4309998159694175,0.0,0.09267431597528684,0.09267431597528684,0.45532756172969063,0,0,15.968225948808474
28
+ shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.04,0.45604679603642545,17.440173470996626,0.17440173470996626,0.43028250668592427,0.0,0.13062665489849956,0.13062665489849956,0.4534907811633413,0,0,16.050308914386584
29
+ shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.06,0.45204163612198556,16.89523258317781,0.16895232583177808,0.42594768159318286,0.0,0.12533097969991175,0.12533097969991175,0.44960959510411197,0,0,15.972639011473962
30
+ shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.08,0.4442106511292453,16.16623784482793,0.16166237844827927,0.4196173445876259,0.0,0.18711385701676964,0.18711385701676964,0.4406628043373358,0,0,15.998234774933804
31
+ shenzhi-wang/Llama3.1-70B-Chinese-Chat,1.10,0.43798379261381615,15.601722576240661,0.1560172257624066,0.4135114396257313,0.0,0.08649602824360106,0.08649602824360106,0.4363516968290564,0,0,16.018534863195057
32
  shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.00,0.43363250166217604,15.209540658023398,0.1520954065802339,0.4087331128794971,0.0,5.798764342453663,5.798764342453663,0.36177551894565085,0,1,1.7625772285966461
33
  shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.02,0.4329054166518245,15.19102241646024,0.1519102241646024,0.4070425935096388,0.0,5.77846425419241,5.77846425419241,0.3613372514106729,0,1,1.7493380406001766
34
  shenzhi-wang/Llama3.1-8B-Chinese-Chat,1.04,0.43204787009562073,15.051351661582961,0.15051351661582968,0.40610700867871297,0.0,0.11827007943512798,0.11827007943512798,0.42985292605837966,0,0,1.0467784642541924