Diogo-V commited on
Commit
be54340
1 Parent(s): 6b6b063

Adds final graphs

Browse files
Files changed (40) hide show
  1. results/best_param_per_func_with_baselines/tinyllama/4/best_param_per_func_with_baselines.png +0 -0
  2. results/best_param_per_func_with_baselines/tinyllama/5/best_param_per_func_with_baselines.png +0 -0
  3. results/best_param_per_func_with_baselines/tinyllama/6/best_param_per_func_with_baselines.png +0 -0
  4. results/best_param_per_func_with_baselines/tinyllama/7/best_param_per_func_with_baselines.png +0 -0
  5. results/best_param_per_func_with_baselines/tinyllama/8/best_param_per_func_with_baselines.png +0 -0
  6. results/bitwidth_acc_decay_per_function/tinyllama.png +0 -0
  7. results/df.tsv +19 -62
  8. results/func_by_param_init_method/tinyllama/4/comb_1.png +0 -0
  9. results/func_by_param_init_method/tinyllama/4/comb_15.png +0 -0
  10. results/func_by_param_init_method/tinyllama/4/comb_16.png +0 -0
  11. results/func_by_param_init_method/tinyllama/4/comb_4.png +0 -0
  12. results/func_by_param_init_method/tinyllama/4/comb_6.png +0 -0
  13. results/func_by_param_init_method/tinyllama/4/comb_8.png +0 -0
  14. results/func_by_param_init_method/tinyllama/5/comb_1.png +0 -0
  15. results/func_by_param_init_method/tinyllama/5/comb_15.png +0 -0
  16. results/func_by_param_init_method/tinyllama/5/comb_16.png +0 -0
  17. results/func_by_param_init_method/tinyllama/5/comb_4.png +0 -0
  18. results/func_by_param_init_method/tinyllama/5/comb_6.png +0 -0
  19. results/func_by_param_init_method/tinyllama/5/comb_8.png +0 -0
  20. results/func_by_param_init_method/tinyllama/6/comb_1.png +0 -0
  21. results/func_by_param_init_method/tinyllama/6/comb_15.png +0 -0
  22. results/func_by_param_init_method/tinyllama/6/comb_16.png +0 -0
  23. results/func_by_param_init_method/tinyllama/6/comb_4.png +0 -0
  24. results/func_by_param_init_method/tinyllama/6/comb_6.png +0 -0
  25. results/func_by_param_init_method/tinyllama/6/comb_8.png +0 -0
  26. results/func_by_param_init_method/tinyllama/7/comb_1.png +0 -0
  27. results/func_by_param_init_method/tinyllama/7/comb_12.png +0 -0
  28. results/func_by_param_init_method/tinyllama/7/comb_15.png +0 -0
  29. results/func_by_param_init_method/tinyllama/7/comb_16.png +0 -0
  30. results/func_by_param_init_method/tinyllama/7/comb_4.png +0 -0
  31. results/func_by_param_init_method/tinyllama/7/comb_6.png +0 -0
  32. results/func_by_param_init_method/tinyllama/7/comb_8.png +0 -0
  33. results/func_by_param_init_method/tinyllama/8/comb_1.png +0 -0
  34. results/func_by_param_init_method/tinyllama/8/comb_12.png +0 -0
  35. results/func_by_param_init_method/tinyllama/8/comb_15.png +0 -0
  36. results/func_by_param_init_method/tinyllama/8/comb_16.png +0 -0
  37. results/func_by_param_init_method/tinyllama/8/comb_4.png +0 -0
  38. results/func_by_param_init_method/tinyllama/8/comb_6.png +0 -0
  39. results/func_by_param_init_method/tinyllama/8/comb_8.png +0 -0
  40. results/results.txt +70 -113
results/best_param_per_func_with_baselines/tinyllama/4/best_param_per_func_with_baselines.png CHANGED
results/best_param_per_func_with_baselines/tinyllama/5/best_param_per_func_with_baselines.png CHANGED
results/best_param_per_func_with_baselines/tinyllama/6/best_param_per_func_with_baselines.png CHANGED
results/best_param_per_func_with_baselines/tinyllama/7/best_param_per_func_with_baselines.png CHANGED
results/best_param_per_func_with_baselines/tinyllama/8/best_param_per_func_with_baselines.png CHANGED
results/bitwidth_acc_decay_per_function/tinyllama.png CHANGED
results/df.tsv CHANGED
@@ -1,6 +1,6 @@
1
  accuracy bits clip dataset method model params peak_mem_alloc_mb peak_mem_reserv_mb perplexity time_ms wer
2
  0.3641674816608429 4 0.0 wikitext ao_woq tinyllama fixed 741.692928 866.123776 7.043089866638184 18.421297 0.0
3
- 0.37713611125946045 8 0.0 wikitext ao_woq tinyllama fixed 1631.725568 1988.100096 6.605966091156006 15.539978 0.0
4
  0.0 4 0.0 wikitext comb_17 tinyllama rnd_search_t_cos 1895.561216 2157.969408 1.110665202140808 19.820667 0.0
5
  0.0 5 0.0 wikitext comb_17 tinyllama rnd_search_t_cos 1895.561216 2157.969408 1.110665202140808 19.820667 0.0
6
  0.0 6 0.0 wikitext comb_17 tinyllama rnd_search_t_cos 1895.561216 2157.969408 1.110665202140808 19.820667 0.0
@@ -14,13 +14,13 @@ accuracy bits clip dataset method model params peak_mem_alloc_mb peak_mem_reserv
14
  0.3492738604545593 5 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 7.59440803527832 14.804527 0.0
15
  0.3748057782649994 6 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 6.820615768432617 15.094575 0.0
16
  0.3736913502216339 7 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 6.751235485076904 15.129384 0.0
17
- 0.32529547810554504 4 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 8.292394638061523 15.266298 0.0
18
  0.376629501581192 8 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 6.648813247680664 15.610503 0.0
19
- 0.37727120518684387 8 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.604811191558838 15.927165 0.0
20
  0.3676123023033142 5 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.966304302215576 16.687837 0.0
21
  0.3763255476951599 7 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.663349628448486 16.806651 0.0
22
  0.3469773828983307 4 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 7.655362606048584 66.058771 0.0
23
- 0.37858834862709045 6 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.501583099365234 67.418015 0.0
24
  0.0 4 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.145394206047058 27.563773 0.0
25
  0.0 5 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.145394206047058 27.563773 0.0
26
  0.0 6 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.145394206047058 27.563773 0.0
@@ -29,84 +29,41 @@ accuracy bits clip dataset method model params peak_mem_alloc_mb peak_mem_reserv
29
  0.0 6 0.0 wikitext comb_18 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1098952293395996 27.570311 0.0
30
  0.0 7 0.0 wikitext comb_18 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1098952293395996 27.570311 0.0
31
  0.0 8 0.0 wikitext comb_18 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1098952293395996 27.570311 0.0
32
- 0.004761905409395695 7 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.109161138534546 27.592245 0.0
33
  0.0 4 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
34
  0.0 5 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
35
  0.0 6 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
36
  0.0 7 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
37
  0.0 8 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
38
- 0.37514355778694153 6 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.78739070892334 27.790898 0.0
39
  0.376156747341156 8 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.630317687988281 27.814126 0.0
40
  0.3734549283981323 6 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.796349048614502 27.820068 0.0
41
- 0.26254647970199585 8 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.865216 2160.06656 11.513182640075684 27.840571 0.0
42
- 0.34839582443237305 5 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.647418022155762 27.847983 0.0
43
  0.3727119565010071 7 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.718999862670898 27.887398 0.0
44
- 0.37510979175567627 7 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.765981674194336 27.897337 0.0
45
- 0.35717666149139404 5 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.300607204437256 27.898576 0.0
46
- 0.32806485891342163 4 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.234101295471191 27.919429 0.0
47
- 0.32080379128456116 4 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.386785507202148 27.93508 0.0
48
  0.3131374716758728 4 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.788942337036133 27.95638 0.0
49
  0.3746369481086731 6 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.822465896606445 27.985409 0.0
50
  0.3722391128540039 7 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.787343502044678 27.986104 0.0
51
- 0.37497466802597046 6 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.805139541625977 28.016486 0.0
52
  0.3236069083213806 4 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.328503608703613 28.020534 0.0
53
  0.3750084638595581 8 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.664987087249756 28.03746 0.0
54
- 0.37436679005622864 8 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.7002363204956055 28.046061 0.0
55
- 0.35471126437187195 5 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.370707988739014 28.099499 0.0
56
  0.3736575245857239 6 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.787633895874023 35.160303 0.0
57
- 0.32056736946105957 4 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.467190742492676 35.206603 0.0
58
  0.3745693862438202 7 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.77103328704834 35.208994 0.0
59
  0.3473488688468933 5 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.646571636199951 35.212547 0.0
60
- 0.37666332721710205 8 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.642916202545166 35.446694 0.0
61
  0.3745694160461426 7 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.72044563293457 74.097814 0.0
62
- 0.37683215737342834 8 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.651950836181641 93.118894 0.0
63
  0.3527524769306183 5 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.499456882476807 93.750203 0.0
64
- 0.0 8 0.0 wikitext comb_5_t tinyllama rnd_search_t_cos 1904.146432 2174.746624 1.1093064546585083 26.186495 0.0
65
- 0.04212454706430435 8 0.0 wikitext comb_17_t tinyllama rnd_search_t_cos 1904.09728 2178.940928 1.2985304594039917 19.83594 0.0
66
- 0.4716987609863281 6 0.0 wikitext comb_15_t tinyllama rnd_search_t_cos 1904.551936 2178.940928 3.7289092540740967 14.556232 0.0
67
- 0.3973657488822937 4 0.0 wikitext comb_15_t tinyllama rnd_search_t_cos 1904.551936 2178.940928 5.701084136962891 15.057053 0.0
68
- 0.45427221059799194 5 0.0 wikitext comb_15_t tinyllama rnd_search_t_cos 1904.551936 2178.940928 4.304772853851318 15.347903 0.0
69
- 0.46936845779418945 7 0.0 wikitext comb_15_t tinyllama rnd_search_t_cos 1904.551936 2178.940928 3.6145713329315186 15.671561 0.0
70
- 0.43931108713150024 8 0.0 wikitext comb_15_t tinyllama rnd_search_t_cos 1904.551936 2178.940928 3.9724502563476562 47.707188 0.0
71
- 0.4452211856842041 8 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 3.924962282180786 15.956677 0.0
72
- 0.47075313329696655 7 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 3.660214424133301 16.348675 0.0
73
- 0.4528537690639496 5 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 4.42483377456665 16.366052 0.0
74
- 0.4612968862056732 6 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 3.779924154281616 16.870858 0.0
75
- 0.39648768305778503 4 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 5.761601448059082 65.856696 0.0
76
- 0.0158730186522007 8 0.0 wikitext comb_10_t tinyllama rnd_search_t_cos 1905.921024 2181.03808 1.147719144821167 27.826014 0.0
77
- 0.13154339790344238 6 0.0 wikitext comb_12_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 23.68007469177246 27.735822 0.0
78
- 0.12546437978744507 8 0.0 wikitext comb_12_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 23.399200439453125 27.75806 0.0
79
- 0.47490713000297546 6 0.0 wikitext comb_6_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.746734619140625 27.769552 0.0
80
- 0.12546437978744507 7 0.0 wikitext comb_12_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 21.65581512451172 27.8162 0.0
81
- 0.4027355909347534 4 0.0 wikitext comb_1_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 5.609149932861328 27.82333 0.0
82
- 0.4416751265525818 8 0.0 wikitext comb_8_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 4.001720905303955 27.839803 0.0
83
- 0.467646062374115 6 0.0 wikitext comb_4_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.811641216278076 27.84338 0.0
84
- 0.46382978558540344 5 0.0 wikitext comb_8_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 4.091793060302734 27.844181 0.0
85
- 0.4553191661834717 5 0.0 wikitext comb_6_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 4.374711036682129 27.884053 0.0
86
- 0.3977372646331787 4 0.0 wikitext comb_8_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 5.561113357543945 27.886438 0.0
87
- 0.47105708718299866 7 0.0 wikitext comb_6_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.645103931427002 27.901748 0.0
88
- 0.4689632058143616 7 0.0 wikitext comb_1_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.678706169128418 27.903886 0.0
89
- 0.46990883350372314 7 0.0 wikitext comb_8_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.6156325340270996 27.919573 0.0
90
- 0.46372848749160767 6 0.0 wikitext comb_1_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.766780138015747 27.928961 0.0
91
- 0.45812228322029114 5 0.0 wikitext comb_4_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 4.280441761016846 27.931659 0.0
92
- 0.12104019522666931 8 0.0 wikitext comb_18_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 39.476627349853516 27.935854 0.0
93
- 0.4764944314956665 8 0.0 wikitext comb_4_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.731606960296631 27.972789 0.0
94
- 0.4374873638153076 8 0.0 wikitext comb_6_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.956845998764038 28.034313 0.0
95
- 0.40087810158729553 4 0.0 wikitext comb_6_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 5.790101051330566 28.052892 0.0
96
- 0.3941236138343811 4 0.0 wikitext comb_4_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 5.85722541809082 28.091564 0.0
97
- 0.47207027673721313 7 0.0 wikitext comb_4_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.570634603500366 28.131657 0.0
98
- 0.4493752121925354 8 0.0 wikitext comb_1_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.9227662086486816 28.16754 0.0
99
- 0.4734211564064026 6 0.0 wikitext comb_16_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.703791618347168 35.2082 0.0
100
- 0.4717325270175934 7 0.0 wikitext comb_16_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.6275858879089355 35.244539 0.0
101
- 0.39902064204216003 4 0.0 wikitext comb_16_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 5.773286819458008 35.27738 0.0
102
- 0.44332998991012573 8 0.0 wikitext comb_16_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.890549421310425 35.392824 0.0
103
- 0.4575481116771698 5 0.0 wikitext comb_16_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 4.395427227020264 35.603151 0.0
104
- 0.4595406949520111 5 0.0 wikitext comb_1_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 4.108213424682617 92.241717 0.0
105
- 0.4745018780231476 6 0.0 wikitext comb_8_t tinyllama rnd_search_t_cos 1906.384896 2181.03808 3.743009090423584 93.968884 0.0
106
  0.0 4 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
107
  0.0 5 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
108
  0.0 6 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
109
  0.0 7 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
110
  0.0 8 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
111
- 0.0 8 0.0 wikitext comb_3_t tinyllama rnd_search_t_cos 1389.689856 2499.805184 1.112532615661621 0.489505 0.0
112
- 0.37814927101135254 32 0.0 wikitext base tinyllama ---- 4470.547968 4485.808128 6.595952033996582 11.494127 0.0
 
1
  accuracy bits clip dataset method model params peak_mem_alloc_mb peak_mem_reserv_mb perplexity time_ms wer
2
  0.3641674816608429 4 0.0 wikitext ao_woq tinyllama fixed 741.692928 866.123776 7.043089866638184 18.421297 0.0
3
+ 0.3771361112594604 8 0.0 wikitext ao_woq tinyllama fixed 1631.725568 1988.100096 6.605966091156006 15.539978 0.0
4
  0.0 4 0.0 wikitext comb_17 tinyllama rnd_search_t_cos 1895.561216 2157.969408 1.110665202140808 19.820667 0.0
5
  0.0 5 0.0 wikitext comb_17 tinyllama rnd_search_t_cos 1895.561216 2157.969408 1.110665202140808 19.820667 0.0
6
  0.0 6 0.0 wikitext comb_17 tinyllama rnd_search_t_cos 1895.561216 2157.969408 1.110665202140808 19.820667 0.0
 
14
  0.3492738604545593 5 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 7.59440803527832 14.804527 0.0
15
  0.3748057782649994 6 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 6.820615768432617 15.094575 0.0
16
  0.3736913502216339 7 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 6.751235485076904 15.129384 0.0
17
+ 0.325295478105545 4 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 8.292394638061523 15.266298 0.0
18
  0.376629501581192 8 0.0 wikitext comb_15 tinyllama rnd_search_t_cos 1896.032256 2157.969408 6.648813247680664 15.610503 0.0
19
+ 0.3772712051868438 8 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.604811191558838 15.927165 0.0
20
  0.3676123023033142 5 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.966304302215576 16.687837 0.0
21
  0.3763255476951599 7 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.663349628448486 16.806651 0.0
22
  0.3469773828983307 4 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 7.655362606048584 66.058771 0.0
23
+ 0.3785883486270904 6 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.501583099365234 67.418015 0.0
24
  0.0 4 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.145394206047058 27.563773 0.0
25
  0.0 5 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.145394206047058 27.563773 0.0
26
  0.0 6 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.145394206047058 27.563773 0.0
 
29
  0.0 6 0.0 wikitext comb_18 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1098952293395996 27.570311 0.0
30
  0.0 7 0.0 wikitext comb_18 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1098952293395996 27.570311 0.0
31
  0.0 8 0.0 wikitext comb_18 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1098952293395996 27.570311 0.0
32
+ 0.0047619054093956 7 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.109161138534546 27.592245 0.0
33
  0.0 4 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
34
  0.0 5 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
35
  0.0 6 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
36
  0.0 7 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
37
  0.0 8 0.0 wikitext comb_10 tinyllama rnd_search_t_cos 1897.394176 2160.06656 1.1163378953933716 27.698181 0.0
38
+ 0.3751435577869415 6 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.78739070892334 27.790898 0.0
39
  0.376156747341156 8 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.630317687988281 27.814126 0.0
40
  0.3734549283981323 6 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.796349048614502 27.820068 0.0
41
+ 0.2625464797019958 8 0.0 wikitext comb_12 tinyllama rnd_search_t_cos 1897.865216 2160.06656 11.513182640075684 27.840571 0.0
42
+ 0.348395824432373 5 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.647418022155762 27.847983 0.0
43
  0.3727119565010071 7 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.718999862670898 27.887398 0.0
44
+ 0.3751097917556762 7 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.765981674194336 27.897337 0.0
45
+ 0.357176661491394 5 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.300607204437256 27.898576 0.0
46
+ 0.3280648589134216 4 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.234101295471191 27.919429 0.0
47
+ 0.3208037912845611 4 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.386785507202148 27.93508 0.0
48
  0.3131374716758728 4 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.788942337036133 27.95638 0.0
49
  0.3746369481086731 6 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.822465896606445 27.985409 0.0
50
  0.3722391128540039 7 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.787343502044678 27.986104 0.0
51
+ 0.3749746680259704 6 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.805139541625977 28.016486 0.0
52
  0.3236069083213806 4 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.328503608703613 28.020534 0.0
53
  0.3750084638595581 8 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.664987087249756 28.03746 0.0
54
+ 0.3743667900562286 8 0.0 wikitext comb_8 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.7002363204956055 28.046061 0.0
55
+ 0.3547112643718719 5 0.0 wikitext comb_6 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.370707988739014 28.099499 0.0
56
  0.3736575245857239 6 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.787633895874023 35.160303 0.0
57
+ 0.3205673694610595 4 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 8.467190742492676 35.206603 0.0
58
  0.3745693862438202 7 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.77103328704834 35.208994 0.0
59
  0.3473488688468933 5 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.646571636199951 35.212547 0.0
60
+ 0.376663327217102 8 0.0 wikitext comb_16 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.642916202545166 35.446694 0.0
61
  0.3745694160461426 7 0.0 wikitext comb_4 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.72044563293457 74.097814 0.0
62
+ 0.3768321573734283 8 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 6.651950836181641 93.118894 0.0
63
  0.3527524769306183 5 0.0 wikitext comb_1 tinyllama rnd_search_t_cos 1897.865216 2160.06656 7.499456882476807 93.750203 0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
64
  0.0 4 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
65
  0.0 5 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
66
  0.0 6 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
67
  0.0 7 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
68
  0.0 8 0.0 wikitext comb_3 tinyllama rnd_search_t_cos 1381.170176 2487.222272 1.1207027435302734 0.510374 0.0
69
+ 0.3781492710113525 32 0.0 wikitext base tinyllama ---- 4470.547968 4485.808128 6.595952033996582 11.494127 0.0
 
results/func_by_param_init_method/tinyllama/4/comb_1.png CHANGED
results/func_by_param_init_method/tinyllama/4/comb_15.png CHANGED
results/func_by_param_init_method/tinyllama/4/comb_16.png CHANGED
results/func_by_param_init_method/tinyllama/4/comb_4.png CHANGED
results/func_by_param_init_method/tinyllama/4/comb_6.png CHANGED
results/func_by_param_init_method/tinyllama/4/comb_8.png CHANGED
results/func_by_param_init_method/tinyllama/5/comb_1.png CHANGED
results/func_by_param_init_method/tinyllama/5/comb_15.png CHANGED
results/func_by_param_init_method/tinyllama/5/comb_16.png CHANGED
results/func_by_param_init_method/tinyllama/5/comb_4.png CHANGED
results/func_by_param_init_method/tinyllama/5/comb_6.png CHANGED
results/func_by_param_init_method/tinyllama/5/comb_8.png CHANGED
results/func_by_param_init_method/tinyllama/6/comb_1.png CHANGED
results/func_by_param_init_method/tinyllama/6/comb_15.png CHANGED
results/func_by_param_init_method/tinyllama/6/comb_16.png CHANGED
results/func_by_param_init_method/tinyllama/6/comb_4.png CHANGED
results/func_by_param_init_method/tinyllama/6/comb_6.png CHANGED
results/func_by_param_init_method/tinyllama/6/comb_8.png CHANGED
results/func_by_param_init_method/tinyllama/7/comb_1.png CHANGED
results/func_by_param_init_method/tinyllama/7/comb_12.png CHANGED
results/func_by_param_init_method/tinyllama/7/comb_15.png CHANGED
results/func_by_param_init_method/tinyllama/7/comb_16.png CHANGED
results/func_by_param_init_method/tinyllama/7/comb_4.png CHANGED
results/func_by_param_init_method/tinyllama/7/comb_6.png CHANGED
results/func_by_param_init_method/tinyllama/7/comb_8.png CHANGED
results/func_by_param_init_method/tinyllama/8/comb_1.png CHANGED
results/func_by_param_init_method/tinyllama/8/comb_12.png CHANGED
results/func_by_param_init_method/tinyllama/8/comb_15.png CHANGED
results/func_by_param_init_method/tinyllama/8/comb_16.png CHANGED
results/func_by_param_init_method/tinyllama/8/comb_4.png CHANGED
results/func_by_param_init_method/tinyllama/8/comb_6.png CHANGED
results/func_by_param_init_method/tinyllama/8/comb_8.png CHANGED
results/results.txt CHANGED
@@ -1,113 +1,70 @@
1
- | | accuracy | bits | clip | dataset | method | model | params | peak_mem_alloc_mb | peak_mem_reserv_mb | perplexity | time_ms | wer |
2
- |----:|-----------:|-------:|-------:|:----------|:----------|:----------|:-----------------|--------------------:|---------------------:|-------------:|----------:|------:|
3
- | 0 | 0.364167 | 4 | 0 | wikitext | ao_woq | tinyllama | fixed | 741.693 | 866.124 | 7.04309 | 18.4213 | 0 |
4
- | 1 | 0.377136 | 8 | 0 | wikitext | ao_woq | tinyllama | fixed | 1631.73 | 1988.1 | 6.60597 | 15.54 | 0 |
5
- | 2 | 0 | 4 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.11067 | 19.8207 | 0 |
6
- | 3 | 0 | 5 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.11067 | 19.8207 | 0 |
7
- | 4 | 0 | 6 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.11067 | 19.8207 | 0 |
8
- | 5 | 0 | 7 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.11067 | 19.8207 | 0 |
9
- | 6 | 0 | 8 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.11067 | 19.8207 | 0 |
10
- | 7 | 0 | 4 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.10931 | 26.1773 | 0 |
11
- | 8 | 0 | 5 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.10931 | 26.1773 | 0 |
12
- | 9 | 0 | 6 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.10931 | 26.1773 | 0 |
13
- | 10 | 0 | 7 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.10931 | 26.1773 | 0 |
14
- | 11 | 0 | 8 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.10931 | 26.1773 | 0 |
15
- | 12 | 0.349274 | 5 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 7.59441 | 14.8045 | 0 |
16
- | 13 | 0.374806 | 6 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 6.82062 | 15.0946 | 0 |
17
- | 14 | 0.373691 | 7 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 6.75124 | 15.1294 | 0 |
18
- | 15 | 0.325295 | 4 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 8.29239 | 15.2663 | 0 |
19
- | 16 | 0.37663 | 8 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 6.64881 | 15.6105 | 0 |
20
- | 17 | 0.377271 | 8 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.60481 | 15.9272 | 0 |
21
- | 18 | 0.367612 | 5 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.9663 | 16.6878 | 0 |
22
- | 19 | 0.376326 | 7 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.66335 | 16.8067 | 0 |
23
- | 20 | 0.346977 | 4 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 7.65536 | 66.0588 | 0 |
24
- | 21 | 0.378588 | 6 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.50158 | 67.418 | 0 |
25
- | 22 | 0 | 4 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.14539 | 27.5638 | 0 |
26
- | 23 | 0 | 5 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.14539 | 27.5638 | 0 |
27
- | 24 | 0 | 6 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.14539 | 27.5638 | 0 |
28
- | 25 | 0 | 4 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
29
- | 26 | 0 | 5 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
30
- | 27 | 0 | 6 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
31
- | 28 | 0 | 7 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
32
- | 29 | 0 | 8 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
33
- | 30 | 0.00476191 | 7 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.10916 | 27.5922 | 0 |
34
- | 31 | 0 | 4 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.11634 | 27.6982 | 0 |
35
- | 32 | 0 | 5 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.11634 | 27.6982 | 0 |
36
- | 33 | 0 | 6 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.11634 | 27.6982 | 0 |
37
- | 34 | 0 | 7 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.11634 | 27.6982 | 0 |
38
- | 35 | 0 | 8 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.11634 | 27.6982 | 0 |
39
- | 36 | 0.375144 | 6 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.78739 | 27.7909 | 0 |
40
- | 37 | 0.376157 | 8 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.63032 | 27.8141 | 0 |
41
- | 38 | 0.373455 | 6 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.79635 | 27.8201 | 0 |
42
- | 39 | 0.262546 | 8 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 11.5132 | 27.8406 | 0 |
43
- | 40 | 0.348396 | 5 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.64742 | 27.848 | 0 |
44
- | 41 | 0.372712 | 7 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.719 | 27.8874 | 0 |
45
- | 42 | 0.37511 | 7 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.76598 | 27.8973 | 0 |
46
- | 43 | 0.357177 | 5 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.30061 | 27.8986 | 0 |
47
- | 44 | 0.328065 | 4 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.2341 | 27.9194 | 0 |
48
- | 45 | 0.320804 | 4 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.38679 | 27.9351 | 0 |
49
- | 46 | 0.313137 | 4 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.78894 | 27.9564 | 0 |
50
- | 47 | 0.374637 | 6 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.82247 | 27.9854 | 0 |
51
- | 48 | 0.372239 | 7 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.78734 | 27.9861 | 0 |
52
- | 49 | 0.374975 | 6 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.80514 | 28.0165 | 0 |
53
- | 50 | 0.323607 | 4 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.3285 | 28.0205 | 0 |
54
- | 51 | 0.375008 | 8 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.66499 | 28.0375 | 0 |
55
- | 52 | 0.374367 | 8 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.70024 | 28.0461 | 0 |
56
- | 53 | 0.354711 | 5 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.37071 | 28.0995 | 0 |
57
- | 54 | 0.373658 | 6 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.78763 | 35.1603 | 0 |
58
- | 55 | 0.320567 | 4 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.46719 | 35.2066 | 0 |
59
- | 56 | 0.374569 | 7 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.77103 | 35.209 | 0 |
60
- | 57 | 0.347349 | 5 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.64657 | 35.2125 | 0 |
61
- | 58 | 0.376663 | 8 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.64292 | 35.4467 | 0 |
62
- | 59 | 0.374569 | 7 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.72045 | 74.0978 | 0 |
63
- | 60 | 0.376832 | 8 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.65195 | 93.1189 | 0 |
64
- | 61 | 0.352752 | 5 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.49946 | 93.7502 | 0 |
65
- | 62 | 0 | 8 | 0 | wikitext | comb_5_t | tinyllama | rnd_search_t_cos | 1904.15 | 2174.75 | 1.10931 | 26.1865 | 0 |
66
- | 63 | 0.0421245 | 8 | 0 | wikitext | comb_17_t | tinyllama | rnd_search_t_cos | 1904.1 | 2178.94 | 1.29853 | 19.8359 | 0 |
67
- | 64 | 0.471699 | 6 | 0 | wikitext | comb_15_t | tinyllama | rnd_search_t_cos | 1904.55 | 2178.94 | 3.72891 | 14.5562 | 0 |
68
- | 65 | 0.397366 | 4 | 0 | wikitext | comb_15_t | tinyllama | rnd_search_t_cos | 1904.55 | 2178.94 | 5.70108 | 15.0571 | 0 |
69
- | 66 | 0.454272 | 5 | 0 | wikitext | comb_15_t | tinyllama | rnd_search_t_cos | 1904.55 | 2178.94 | 4.30477 | 15.3479 | 0 |
70
- | 67 | 0.469368 | 7 | 0 | wikitext | comb_15_t | tinyllama | rnd_search_t_cos | 1904.55 | 2178.94 | 3.61457 | 15.6716 | 0 |
71
- | 68 | 0.439311 | 8 | 0 | wikitext | comb_15_t | tinyllama | rnd_search_t_cos | 1904.55 | 2178.94 | 3.97245 | 47.7072 | 0 |
72
- | 69 | 0.445221 | 8 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 3.92496 | 15.9567 | 0 |
73
- | 70 | 0.470753 | 7 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 3.66021 | 16.3487 | 0 |
74
- | 71 | 0.452854 | 5 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 4.42483 | 16.3661 | 0 |
75
- | 72 | 0.461297 | 6 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 3.77992 | 16.8709 | 0 |
76
- | 73 | 0.396488 | 4 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 5.7616 | 65.8567 | 0 |
77
- | 74 | 0.015873 | 8 | 0 | wikitext | comb_10_t | tinyllama | rnd_search_t_cos | 1905.92 | 2181.04 | 1.14772 | 27.826 | 0 |
78
- | 75 | 0.131543 | 6 | 0 | wikitext | comb_12_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 23.6801 | 27.7358 | 0 |
79
- | 76 | 0.125464 | 8 | 0 | wikitext | comb_12_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 23.3992 | 27.7581 | 0 |
80
- | 77 | 0.474907 | 6 | 0 | wikitext | comb_6_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.74673 | 27.7696 | 0 |
81
- | 78 | 0.125464 | 7 | 0 | wikitext | comb_12_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 21.6558 | 27.8162 | 0 |
82
- | 79 | 0.402736 | 4 | 0 | wikitext | comb_1_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 5.60915 | 27.8233 | 0 |
83
- | 80 | 0.441675 | 8 | 0 | wikitext | comb_8_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 4.00172 | 27.8398 | 0 |
84
- | 81 | 0.467646 | 6 | 0 | wikitext | comb_4_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.81164 | 27.8434 | 0 |
85
- | 82 | 0.46383 | 5 | 0 | wikitext | comb_8_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 4.09179 | 27.8442 | 0 |
86
- | 83 | 0.455319 | 5 | 0 | wikitext | comb_6_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 4.37471 | 27.8841 | 0 |
87
- | 84 | 0.397737 | 4 | 0 | wikitext | comb_8_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 5.56111 | 27.8864 | 0 |
88
- | 85 | 0.471057 | 7 | 0 | wikitext | comb_6_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.6451 | 27.9017 | 0 |
89
- | 86 | 0.468963 | 7 | 0 | wikitext | comb_1_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.67871 | 27.9039 | 0 |
90
- | 87 | 0.469909 | 7 | 0 | wikitext | comb_8_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.61563 | 27.9196 | 0 |
91
- | 88 | 0.463728 | 6 | 0 | wikitext | comb_1_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.76678 | 27.929 | 0 |
92
- | 89 | 0.458122 | 5 | 0 | wikitext | comb_4_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 4.28044 | 27.9317 | 0 |
93
- | 90 | 0.12104 | 8 | 0 | wikitext | comb_18_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 39.4766 | 27.9359 | 0 |
94
- | 91 | 0.476494 | 8 | 0 | wikitext | comb_4_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.73161 | 27.9728 | 0 |
95
- | 92 | 0.437487 | 8 | 0 | wikitext | comb_6_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.95685 | 28.0343 | 0 |
96
- | 93 | 0.400878 | 4 | 0 | wikitext | comb_6_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 5.7901 | 28.0529 | 0 |
97
- | 94 | 0.394124 | 4 | 0 | wikitext | comb_4_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 5.85723 | 28.0916 | 0 |
98
- | 95 | 0.47207 | 7 | 0 | wikitext | comb_4_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.57063 | 28.1317 | 0 |
99
- | 96 | 0.449375 | 8 | 0 | wikitext | comb_1_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.92277 | 28.1675 | 0 |
100
- | 97 | 0.473421 | 6 | 0 | wikitext | comb_16_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.70379 | 35.2082 | 0 |
101
- | 98 | 0.471733 | 7 | 0 | wikitext | comb_16_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.62759 | 35.2445 | 0 |
102
- | 99 | 0.399021 | 4 | 0 | wikitext | comb_16_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 5.77329 | 35.2774 | 0 |
103
- | 100 | 0.44333 | 8 | 0 | wikitext | comb_16_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.89055 | 35.3928 | 0 |
104
- | 101 | 0.457548 | 5 | 0 | wikitext | comb_16_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 4.39543 | 35.6032 | 0 |
105
- | 102 | 0.459541 | 5 | 0 | wikitext | comb_1_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 4.10821 | 92.2417 | 0 |
106
- | 103 | 0.474502 | 6 | 0 | wikitext | comb_8_t | tinyllama | rnd_search_t_cos | 1906.38 | 2181.04 | 3.74301 | 93.9689 | 0 |
107
- | 104 | 0 | 4 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.510374 | 0 |
108
- | 105 | 0 | 5 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.510374 | 0 |
109
- | 106 | 0 | 6 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.510374 | 0 |
110
- | 107 | 0 | 7 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.510374 | 0 |
111
- | 108 | 0 | 8 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.510374 | 0 |
112
- | 109 | 0 | 8 | 0 | wikitext | comb_3_t | tinyllama | rnd_search_t_cos | 1389.69 | 2499.81 | 1.11253 | 0.489505 | 0 |
113
- | 110 | 0.378149 | 32 | 0 | wikitext | base | tinyllama | ---- | 4470.55 | 4485.81 | 6.59595 | 11.4941 | 0 |
 
1
+ | | accuracy | bits | clip | dataset | method | model | params | peak_mem_alloc_mb | peak_mem_reserv_mb | perplexity | time_ms | wer |
2
+ |---:|-----------:|-------:|-------:|:----------|:---------|:----------|:-----------------|--------------------:|---------------------:|-------------:|----------:|------:|
3
+ | 0 | 0.3642 | 4 | 0 | wikitext | ao_woq | tinyllama | fixed | 741.693 | 866.124 | 7.0431 | 18.4213 | 0 |
4
+ | 1 | 0.3771 | 8 | 0 | wikitext | ao_woq | tinyllama | fixed | 1631.73 | 1988.1 | 6.606 | 15.54 | 0 |
5
+ | 2 | 0 | 4 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1107 | 19.8207 | 0 |
6
+ | 3 | 0 | 5 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1107 | 19.8207 | 0 |
7
+ | 4 | 0 | 6 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1107 | 19.8207 | 0 |
8
+ | 5 | 0 | 7 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1107 | 19.8207 | 0 |
9
+ | 6 | 0 | 8 | 0 | wikitext | comb_17 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1107 | 19.8207 | 0 |
10
+ | 7 | 0 | 4 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1093 | 26.1773 | 0 |
11
+ | 8 | 0 | 5 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1093 | 26.1773 | 0 |
12
+ | 9 | 0 | 6 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1093 | 26.1773 | 0 |
13
+ | 10 | 0 | 7 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1093 | 26.1773 | 0 |
14
+ | 11 | 0 | 8 | 0 | wikitext | comb_5 | tinyllama | rnd_search_t_cos | 1895.56 | 2157.97 | 1.1093 | 26.1773 | 0 |
15
+ | 12 | 0.3493 | 5 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 7.5944 | 14.8045 | 0 |
16
+ | 13 | 0.3748 | 6 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 6.8206 | 15.0946 | 0 |
17
+ | 14 | 0.3737 | 7 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 6.7512 | 15.1294 | 0 |
18
+ | 15 | 0.3253 | 4 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 8.2924 | 15.2663 | 0 |
19
+ | 16 | 0.3766 | 8 | 0 | wikitext | comb_15 | tinyllama | rnd_search_t_cos | 1896.03 | 2157.97 | 6.6488 | 15.6105 | 0 |
20
+ | 17 | 0.3773 | 8 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.6048 | 15.9272 | 0 |
21
+ | 18 | 0.3676 | 5 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.9663 | 16.6878 | 0 |
22
+ | 19 | 0.3763 | 7 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.6633 | 16.8067 | 0 |
23
+ | 20 | 0.347 | 4 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 7.6554 | 66.0588 | 0 |
24
+ | 21 | 0.3786 | 6 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.5016 | 67.418 | 0 |
25
+ | 22 | 0 | 4 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1454 | 27.5638 | 0 |
26
+ | 23 | 0 | 5 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1454 | 27.5638 | 0 |
27
+ | 24 | 0 | 6 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1454 | 27.5638 | 0 |
28
+ | 25 | 0 | 4 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
29
+ | 26 | 0 | 5 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
30
+ | 27 | 0 | 6 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
31
+ | 28 | 0 | 7 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
32
+ | 29 | 0 | 8 | 0 | wikitext | comb_18 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1099 | 27.5703 | 0 |
33
+ | 30 | 0.0048 | 7 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1092 | 27.5922 | 0 |
34
+ | 31 | 0 | 4 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1163 | 27.6982 | 0 |
35
+ | 32 | 0 | 5 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1163 | 27.6982 | 0 |
36
+ | 33 | 0 | 6 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1163 | 27.6982 | 0 |
37
+ | 34 | 0 | 7 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1163 | 27.6982 | 0 |
38
+ | 35 | 0 | 8 | 0 | wikitext | comb_10 | tinyllama | rnd_search_t_cos | 1897.39 | 2160.07 | 1.1163 | 27.6982 | 0 |
39
+ | 36 | 0.3751 | 6 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.7874 | 27.7909 | 0 |
40
+ | 37 | 0.3762 | 8 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.6303 | 27.8141 | 0 |
41
+ | 38 | 0.3735 | 6 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.7963 | 27.8201 | 0 |
42
+ | 39 | 0.2625 | 8 | 0 | wikitext | comb_12 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 11.5132 | 27.8406 | 0 |
43
+ | 40 | 0.3484 | 5 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.6474 | 27.848 | 0 |
44
+ | 41 | 0.3727 | 7 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.719 | 27.8874 | 0 |
45
+ | 42 | 0.3751 | 7 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.766 | 27.8973 | 0 |
46
+ | 43 | 0.3572 | 5 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.3006 | 27.8986 | 0 |
47
+ | 44 | 0.3281 | 4 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.2341 | 27.9194 | 0 |
48
+ | 45 | 0.3208 | 4 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.3868 | 27.9351 | 0 |
49
+ | 46 | 0.3131 | 4 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.7889 | 27.9564 | 0 |
50
+ | 47 | 0.3746 | 6 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.8225 | 27.9854 | 0 |
51
+ | 48 | 0.3722 | 7 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.7873 | 27.9861 | 0 |
52
+ | 49 | 0.375 | 6 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.8051 | 28.0165 | 0 |
53
+ | 50 | 0.3236 | 4 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.3285 | 28.0205 | 0 |
54
+ | 51 | 0.375 | 8 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.665 | 28.0375 | 0 |
55
+ | 52 | 0.3744 | 8 | 0 | wikitext | comb_8 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.7002 | 28.0461 | 0 |
56
+ | 53 | 0.3547 | 5 | 0 | wikitext | comb_6 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.3707 | 28.0995 | 0 |
57
+ | 54 | 0.3737 | 6 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.7876 | 35.1603 | 0 |
58
+ | 55 | 0.3206 | 4 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 8.4672 | 35.2066 | 0 |
59
+ | 56 | 0.3746 | 7 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.771 | 35.209 | 0 |
60
+ | 57 | 0.3473 | 5 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.6466 | 35.2125 | 0 |
61
+ | 58 | 0.3767 | 8 | 0 | wikitext | comb_16 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.6429 | 35.4467 | 0 |
62
+ | 59 | 0.3746 | 7 | 0 | wikitext | comb_4 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.7204 | 74.0978 | 0 |
63
+ | 60 | 0.3768 | 8 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 6.652 | 93.1189 | 0 |
64
+ | 61 | 0.3528 | 5 | 0 | wikitext | comb_1 | tinyllama | rnd_search_t_cos | 1897.87 | 2160.07 | 7.4995 | 93.7502 | 0 |
65
+ | 62 | 0 | 4 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.5104 | 0 |
66
+ | 63 | 0 | 5 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.5104 | 0 |
67
+ | 64 | 0 | 6 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.5104 | 0 |
68
+ | 65 | 0 | 7 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.5104 | 0 |
69
+ | 66 | 0 | 8 | 0 | wikitext | comb_3 | tinyllama | rnd_search_t_cos | 1381.17 | 2487.22 | 1.1207 | 0.5104 | 0 |
70
+ | 67 | 0.3781 | 32 | 0 | wikitext | base | tinyllama | ---- | 4470.55 | 4485.81 | 6.596 | 11.4941 | 0 |