diff --git a/results/best_param_per_func_with_baselines/tinyllama/4/best_param_per_func_with_baselines.png b/results/best_param_per_func_with_baselines/tinyllama/4/best_param_per_func_with_baselines.png new file mode 100644 index 0000000000000000000000000000000000000000..189f52e5052484cfd0247260f1e542029512d29e Binary files /dev/null and b/results/best_param_per_func_with_baselines/tinyllama/4/best_param_per_func_with_baselines.png differ diff --git a/results/best_param_per_func_with_baselines/tinyllama/5/best_param_per_func_with_baselines.png b/results/best_param_per_func_with_baselines/tinyllama/5/best_param_per_func_with_baselines.png new file mode 100644 index 0000000000000000000000000000000000000000..8556dd27e6dc0aaea972ee96d2d151fef3d68aea Binary files /dev/null and b/results/best_param_per_func_with_baselines/tinyllama/5/best_param_per_func_with_baselines.png differ diff --git a/results/best_param_per_func_with_baselines/tinyllama/6/best_param_per_func_with_baselines.png b/results/best_param_per_func_with_baselines/tinyllama/6/best_param_per_func_with_baselines.png new file mode 100644 index 0000000000000000000000000000000000000000..98c0b23b379d85266f6ce6656b598b78ac2c3350 Binary files /dev/null and b/results/best_param_per_func_with_baselines/tinyllama/6/best_param_per_func_with_baselines.png differ diff --git a/results/best_param_per_func_with_baselines/tinyllama/7/best_param_per_func_with_baselines.png b/results/best_param_per_func_with_baselines/tinyllama/7/best_param_per_func_with_baselines.png new file mode 100644 index 0000000000000000000000000000000000000000..74d04830a5216cc89b16b868c5c4228084f0a01e Binary files /dev/null and b/results/best_param_per_func_with_baselines/tinyllama/7/best_param_per_func_with_baselines.png differ diff --git a/results/best_param_per_func_with_baselines/tinyllama/8/best_param_per_func_with_baselines.png b/results/best_param_per_func_with_baselines/tinyllama/8/best_param_per_func_with_baselines.png new file mode 100644 index 0000000000000000000000000000000000000000..6c467d64ff42884d512b0fb08197beaec18d76aa Binary files /dev/null and b/results/best_param_per_func_with_baselines/tinyllama/8/best_param_per_func_with_baselines.png differ diff --git a/results/bitwidth_acc_decay_per_function/tinyllama.png b/results/bitwidth_acc_decay_per_function/tinyllama.png new file mode 100644 index 0000000000000000000000000000000000000000..9778c9b6deb64718548a449c21093857cfa2a850 Binary files /dev/null and b/results/bitwidth_acc_decay_per_function/tinyllama.png differ diff --git a/results/df.tsv b/results/df.tsv new file mode 100644 index 0000000000000000000000000000000000000000..5c0b58d9d2f767701c58c5af7e2204365a240829 --- /dev/null +++ b/results/df.tsv @@ -0,0 +1,101 @@ +accuracy bits clip dataset method model params peak_mem_alloc_mb peak_mem_reserv_mb perplexity time_ms wer +0.3641674816608429 4 0.0 wikitext ao_woq tinyllama fixed 741.692928 866.123776 7.043089866638184 18.620178 0.0 +0.37713611125946045 8 0.0 wikitext ao_woq tinyllama fixed 1631.725568 1988.100096 6.605966091156006 15.563149 0.0 +0.0 4 0.0 wikitext comb_4 tinyllama nlr_t_lin 1895.561216 2157.969408 1.110665202140808 19.42599 0.0 +0.0 5 0.0 wikitext comb_4 tinyllama nlr_t_lin 1895.561216 2157.969408 1.110665202140808 19.42599 0.0 +0.0 6 0.0 wikitext comb_4 tinyllama nlr_t_lin 1895.561216 2157.969408 1.110665202140808 19.42599 0.0 +0.0 7 0.0 wikitext comb_4 tinyllama nlr_t_lin 1895.561216 2157.969408 1.110665202140808 19.42599 0.0 +0.0 8 0.0 wikitext comb_4 tinyllama nlr_t_lin 1895.561216 2157.969408 1.110665202140808 19.42599 0.0 +0.0 4 0.0 wikitext comb_7 tinyllama nlr_t_lin 1895.561216 2157.969408 1.1093063354492188 25.803776 0.0 +0.0 5 0.0 wikitext comb_7 tinyllama nlr_t_lin 1895.561216 2157.969408 1.1093063354492188 25.803776 0.0 +0.0 6 0.0 wikitext comb_7 tinyllama nlr_t_lin 1895.561216 2157.969408 1.1093063354492188 25.803776 0.0 +0.0 7 0.0 wikitext comb_7 tinyllama nlr_t_lin 1895.561216 2157.969408 1.1093063354492188 25.803776 0.0 +0.0 8 0.0 wikitext comb_7 tinyllama nlr_t_lin 1895.561216 2157.969408 1.1093063354492188 25.803776 0.0 +0.3744005560874939 7 0.0 wikitext comb_15 tinyllama nlr_t_lin 1896.032256 2157.969408 6.7555317878723145 14.687863 0.0 +0.33991897106170654 4 0.0 wikitext comb_15 tinyllama nlr_t_lin 1896.032256 2157.969408 7.798645496368408 15.139578 0.0 +0.36467409133911133 5 0.0 wikitext comb_15 tinyllama nlr_t_lin 1896.032256 2157.969408 7.099495887756348 15.188495 0.0 +0.377001017332077 8 0.0 wikitext comb_15 tinyllama nlr_t_lin 1896.032256 2157.969408 6.6611247062683105 15.278928 0.0 +0.37767645716667175 6 0.0 wikitext comb_15 tinyllama nlr_t_lin 1896.032256 2157.969408 6.699794292449951 15.651638 0.0 +0.3763255476951599 7 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.663349628448486 16.096653 0.0 +0.3676123023033142 5 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.966304302215576 16.134821 0.0 +0.37727120518684387 8 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.604811191558838 16.272615 0.0 +0.37858834862709045 6 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.501583099365234 16.296258 0.0 +0.3469773828983307 4 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 7.655362606048584 16.419508 0.0 +0.0 4 0.0 wikitext comb_1 tinyllama nlr_t_lin 1897.394176 2160.06656 1.1162694692611694 27.063747 0.0 +0.0 5 0.0 wikitext comb_1 tinyllama nlr_t_lin 1897.394176 2160.06656 1.1162694692611694 27.063747 0.0 +0.007936508394777775 7 0.0 wikitext comb_1 tinyllama nlr_t_lin 1897.394176 2160.06656 1.108918309211731 27.189807 0.0 +0.014285716228187084 6 0.0 wikitext comb_1 tinyllama nlr_t_lin 1897.394176 2160.06656 1.1324244737625122 27.21905 0.0 +0.37436679005622864 7 0.0 wikitext comb_18 tinyllama nlr_t_lin 1897.865216 2160.06656 6.747983455657959 27.402022 0.0 +0.3764606714248657 6 0.0 wikitext comb_8 tinyllama nlr_t_lin 1897.865216 2160.06656 6.674111366271973 27.402278 0.0 +0.33944615721702576 4 0.0 wikitext comb_18 tinyllama nlr_t_lin 1897.865216 2160.06656 7.924208641052246 27.415199 0.0 +0.3669368624687195 5 0.0 wikitext comb_8 tinyllama nlr_t_lin 1897.865216 2160.06656 7.094004154205322 27.424887 0.0 +0.3660925626754761 5 0.0 wikitext comb_18 tinyllama nlr_t_lin 1897.865216 2160.06656 7.09657621383667 27.437879 0.0 +0.376629501581192 8 0.0 wikitext comb_10 tinyllama nlr_t_lin 1897.865216 2160.06656 6.645826816558838 27.441238 0.0 +0.3788585066795349 6 0.0 wikitext comb_12 tinyllama nlr_t_lin 1897.865216 2160.06656 6.6869425773620605 27.447294 0.0 +0.3676798641681671 5 0.0 wikitext comb_10 tinyllama nlr_t_lin 1897.865216 2160.06656 7.077613830566406 27.450546 0.0 +0.3750759959220886 7 0.0 wikitext comb_8 tinyllama nlr_t_lin 1897.865216 2160.06656 6.729586124420166 27.452787 0.0 +0.37720364332199097 7 0.0 wikitext comb_12 tinyllama nlr_t_lin 1897.865216 2160.06656 6.737154960632324 27.454265 0.0 +0.1677473932504654 4 0.0 wikitext comb_10 tinyllama nlr_t_lin 1897.865216 2160.06656 20.69113540649414 27.456986 0.0 +0.3408645987510681 4 0.0 wikitext comb_12 tinyllama nlr_t_lin 1897.865216 2160.06656 7.797614097595215 27.48183 0.0 +0.376156747341156 8 0.0 wikitext comb_12 tinyllama nlr_t_lin 1897.865216 2160.06656 6.652891635894775 27.483249 0.0 +0.36781492829322815 5 0.0 wikitext comb_12 tinyllama nlr_t_lin 1897.865216 2160.06656 7.096789360046387 27.485402 0.0 +0.2542722225189209 8 0.0 wikitext comb_1 tinyllama nlr_t_lin 1897.865216 2160.06656 10.974504470825195 27.497876 0.0 +0.3774062693119049 7 0.0 wikitext comb_10 tinyllama nlr_t_lin 1897.865216 2160.06656 6.703912734985352 27.4991 0.0 +0.37744003534317017 6 0.0 wikitext comb_18 tinyllama nlr_t_lin 1897.865216 2160.06656 6.721346378326416 27.508581 0.0 +0.37460318207740784 8 0.0 wikitext comb_8 tinyllama nlr_t_lin 1897.865216 2160.06656 6.66512393951416 27.522588 0.0 +0.3782505989074707 6 0.0 wikitext comb_10 tinyllama nlr_t_lin 1897.865216 2160.06656 6.680172443389893 27.528717 0.0 +0.3761904537677765 8 0.0 wikitext comb_18 tinyllama nlr_t_lin 1897.865216 2160.06656 6.640418529510498 27.529249 0.0 +0.3412022888660431 4 0.0 wikitext comb_8 tinyllama nlr_t_lin 1897.865216 2160.06656 7.811379909515381 27.538141 0.0 +0.3776426911354065 6 0.0 wikitext comb_3 tinyllama nlr_t_lin 1897.865216 2160.06656 6.704628944396973 34.644507 0.0 +0.36541712284088135 5 0.0 wikitext comb_3 tinyllama nlr_t_lin 1897.865216 2160.06656 7.113305568695068 34.653955 0.0 +0.3375886380672455 4 0.0 wikitext comb_3 tinyllama nlr_t_lin 1897.865216 2160.06656 7.9102630615234375 34.675708 0.0 +0.3746369481086731 7 0.0 wikitext comb_3 tinyllama nlr_t_lin 1897.865216 2160.06656 6.742989540100098 34.691848 0.0 +0.37673085927963257 8 0.0 wikitext comb_3 tinyllama nlr_t_lin 1897.865216 2160.06656 6.630740165710449 34.720062 0.0 +0.0 8 0.0 wikitext comb_7_t tinyllama nlr_t_lin 1904.146432 2174.746624 1.1093063354492188 25.924527 0.0 +0.02063492313027382 8 0.0 wikitext comb_4_t tinyllama nlr_t_lin 1904.080896 2178.940928 1.1070170402526855 19.549906 0.0 +0.4691658616065979 7 0.0 wikitext comb_15_t tinyllama nlr_t_lin 1904.551936 2178.940928 3.586782693862915 15.042203 0.0 +0.4721716046333313 6 0.0 wikitext comb_15_t tinyllama nlr_t_lin 1904.551936 2178.940928 3.745493173599243 15.135254 0.0 +0.4073285758495331 4 0.0 wikitext comb_15_t tinyllama nlr_t_lin 1904.551936 2178.940928 5.53889799118042 15.146649 0.0 +0.45879772305488586 5 0.0 wikitext comb_15_t tinyllama nlr_t_lin 1904.551936 2178.940928 4.2737226486206055 15.162692 0.0 +0.4478554427623749 8 0.0 wikitext comb_15_t tinyllama nlr_t_lin 1904.551936 2178.940928 3.9899139404296875 15.255927 0.0 +0.4716312289237976 7 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 3.6278960704803467 15.447449 0.0 +0.39476528763771057 4 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 5.693153381347656 16.155616 0.0 +0.45319148898124695 5 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 4.351770877838135 16.21261 0.0 +0.45180681347846985 8 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 3.8591816425323486 16.247682 0.0 +0.4667342007160187 6 0.0 wikitext woq_t tinyllama fixed 1904.631296 2181.03808 3.7766106128692627 16.613178 0.0 +0.46264776587486267 6 0.0 wikitext comb_8_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.8822555541992188 27.391845 0.0 +0.12546437978744507 8 0.0 wikitext comb_1_t tinyllama nlr_t_lin 1906.384896 2181.03808 23.425905227661133 27.392397 0.0 +0.1343127340078354 6 0.0 wikitext comb_1_t tinyllama nlr_t_lin 1906.384896 2181.03808 23.099044799804688 27.39869 0.0 +0.46727457642555237 6 0.0 wikitext comb_18_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.753908157348633 27.410599 0.0 +0.4711921811103821 6 0.0 wikitext comb_10_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.7106194496154785 27.411855 0.0 +0.40834179520606995 4 0.0 wikitext comb_10_t tinyllama nlr_t_lin 1906.384896 2181.03808 5.6778764724731445 27.416885 0.0 +0.45626479387283325 5 0.0 wikitext comb_8_t tinyllama nlr_t_lin 1906.384896 2181.03808 4.395241737365723 27.42478 0.0 +0.406349241733551 4 0.0 wikitext comb_12_t tinyllama nlr_t_lin 1906.384896 2181.03808 5.512465476989746 27.431829 0.0 +0.4123269021511078 4 0.0 wikitext comb_18_t tinyllama nlr_t_lin 1906.384896 2181.03808 5.4710283279418945 27.432534 0.0 +0.13009119033813477 7 0.0 wikitext comb_1_t tinyllama nlr_t_lin 1906.384896 2181.03808 22.35222053527832 27.444736 0.0 +0.4095238149166107 4 0.0 wikitext comb_8_t tinyllama nlr_t_lin 1906.384896 2181.03808 5.589878082275391 27.44879 0.0 +0.4690307378768921 7 0.0 wikitext comb_10_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.7180914878845215 27.469848 0.0 +0.46541711688041687 7 0.0 wikitext comb_8_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.704385280609131 27.469945 0.0 +0.12445119768381119 5 0.0 wikitext comb_1_t tinyllama nlr_t_lin 1906.384896 2181.03808 23.370811462402344 27.471032 0.0 +0.445997953414917 8 0.0 wikitext comb_10_t tinyllama nlr_t_lin 1906.384896 2181.03808 4.003555774688721 27.499694 0.0 +0.4650118350982666 6 0.0 wikitext comb_12_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.7818164825439453 27.523071 0.0 +0.46889564394950867 7 0.0 wikitext comb_12_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.7109317779541016 27.53212 0.0 +0.44410672783851624 8 0.0 wikitext comb_12_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.909205913543701 27.538954 0.0 +0.4576832056045532 5 0.0 wikitext comb_12_t tinyllama nlr_t_lin 1906.384896 2181.03808 4.175211429595947 27.544406 0.0 +0.44815942645072937 8 0.0 wikitext comb_8_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.942722797393799 27.552825 0.0 +0.47146233916282654 7 0.0 wikitext comb_18_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.6000452041625977 27.559089 0.0 +0.4557919502258301 5 0.0 wikitext comb_18_t tinyllama nlr_t_lin 1906.384896 2181.03808 4.278509616851807 27.605508 0.0 +0.44653835892677307 8 0.0 wikitext comb_18_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.8636558055877686 27.610646 0.0 +0.4560621678829193 5 0.0 wikitext comb_10_t tinyllama nlr_t_lin 1906.384896 2181.03808 4.2374267578125 27.630033 0.0 +0.45650121569633484 5 0.0 wikitext comb_3_t tinyllama nlr_t_lin 1906.384896 2181.03808 4.177881717681885 34.587916 0.0 +0.46919959783554077 6 0.0 wikitext comb_3_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.851466655731201 34.65105 0.0 +0.4524822533130646 8 0.0 wikitext comb_3_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.8512980937957764 34.679813 0.0 +0.4706518054008484 7 0.0 wikitext comb_3_t tinyllama nlr_t_lin 1906.384896 2181.03808 3.625946044921875 34.699284 0.0 +0.40827423334121704 4 0.0 wikitext comb_3_t tinyllama nlr_t_lin 1906.384896 2181.03808 5.55847692489624 34.772857 0.0 +0.0 4 0.0 wikitext comb_11 tinyllama nlr_t_lin 1381.170176 2487.222272 1.1250394582748413 0.501952 0.0 +0.0 5 0.0 wikitext comb_11 tinyllama nlr_t_lin 1381.170176 2487.222272 1.1250394582748413 0.501952 0.0 +0.0 6 0.0 wikitext comb_11 tinyllama nlr_t_lin 1381.170176 2487.222272 1.1250394582748413 0.501952 0.0 +0.0 7 0.0 wikitext comb_11 tinyllama nlr_t_lin 1381.170176 2487.222272 1.1250394582748413 0.501952 0.0 +0.0 8 0.0 wikitext comb_11 tinyllama nlr_t_lin 1381.170176 2487.222272 1.1250394582748413 0.501952 0.0 +0.0 8 0.0 wikitext comb_11_t tinyllama nlr_t_lin 1389.689856 2499.805184 1.1078732013702393 0.506853 0.0 +0.37814927101135254 32 0.0 wikitext base tinyllama ---- 4470.547968 4485.808128 6.595952033996582 11.791439 0.0 diff --git a/results/func_by_param_init_method/tinyllama/4/comb_10.png b/results/func_by_param_init_method/tinyllama/4/comb_10.png new file mode 100644 index 0000000000000000000000000000000000000000..b3dc69f6ed87b5e92d2cfc2b8b108570551ae38e Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_10.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_10_t.png b/results/func_by_param_init_method/tinyllama/4/comb_10_t.png new file mode 100644 index 0000000000000000000000000000000000000000..a0ccb76a75abdb0843a5229f628a5bc47954432c Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_10_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_12.png b/results/func_by_param_init_method/tinyllama/4/comb_12.png new file mode 100644 index 0000000000000000000000000000000000000000..18c0ae02e5dff1cf3511528e6c3c4af5f584161f Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_12.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_12_t.png b/results/func_by_param_init_method/tinyllama/4/comb_12_t.png new file mode 100644 index 0000000000000000000000000000000000000000..bf204290e0ab53cfa20696bd23b638f94189bf08 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_12_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_15.png b/results/func_by_param_init_method/tinyllama/4/comb_15.png new file mode 100644 index 0000000000000000000000000000000000000000..6299b369ca54eb467239106bb570245a9d96bf78 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_15.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_15_t.png b/results/func_by_param_init_method/tinyllama/4/comb_15_t.png new file mode 100644 index 0000000000000000000000000000000000000000..1d8db8abd2e7401abf8d0a645deb489857778498 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_15_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_18.png b/results/func_by_param_init_method/tinyllama/4/comb_18.png new file mode 100644 index 0000000000000000000000000000000000000000..69fa484f9857440b6aa73ace638bdd540059d5d2 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_18.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_18_t.png b/results/func_by_param_init_method/tinyllama/4/comb_18_t.png new file mode 100644 index 0000000000000000000000000000000000000000..f33c6c00bf8f5af51a8487de79192fa796303613 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_18_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_3.png b/results/func_by_param_init_method/tinyllama/4/comb_3.png new file mode 100644 index 0000000000000000000000000000000000000000..5b7261d44fd828ae34cb60748a89234cc714c947 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_3.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_3_t.png b/results/func_by_param_init_method/tinyllama/4/comb_3_t.png new file mode 100644 index 0000000000000000000000000000000000000000..95d884e2d770b8541f899b51d06f09f869327cb2 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_3_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_8.png b/results/func_by_param_init_method/tinyllama/4/comb_8.png new file mode 100644 index 0000000000000000000000000000000000000000..6a8532e0860a4e1e98590c8a57c41487993cee28 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_8.png differ diff --git a/results/func_by_param_init_method/tinyllama/4/comb_8_t.png b/results/func_by_param_init_method/tinyllama/4/comb_8_t.png new file mode 100644 index 0000000000000000000000000000000000000000..ccad743f97961a5145cdabb4f72c2dbebf1c77bd Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/4/comb_8_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_10.png b/results/func_by_param_init_method/tinyllama/5/comb_10.png new file mode 100644 index 0000000000000000000000000000000000000000..c939952a9fe99e7d5c578da8c02142be38a03ccb Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_10.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_10_t.png b/results/func_by_param_init_method/tinyllama/5/comb_10_t.png new file mode 100644 index 0000000000000000000000000000000000000000..7e3277915347320f6d83b974e673edf23c5557f2 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_10_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_12.png b/results/func_by_param_init_method/tinyllama/5/comb_12.png new file mode 100644 index 0000000000000000000000000000000000000000..f2dcb256356f98085dbb447567c38c02e05d800a Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_12.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_12_t.png b/results/func_by_param_init_method/tinyllama/5/comb_12_t.png new file mode 100644 index 0000000000000000000000000000000000000000..0c1546769fc76e94a866f616c1207a8b27760cbb Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_12_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_15.png b/results/func_by_param_init_method/tinyllama/5/comb_15.png new file mode 100644 index 0000000000000000000000000000000000000000..c5eb3202872d7533aa624747dfc60f3d9e9c5561 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_15.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_15_t.png b/results/func_by_param_init_method/tinyllama/5/comb_15_t.png new file mode 100644 index 0000000000000000000000000000000000000000..eb5d19f5b4475037f23c0aed45c1e679aece9b6d Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_15_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_18.png b/results/func_by_param_init_method/tinyllama/5/comb_18.png new file mode 100644 index 0000000000000000000000000000000000000000..09d5a83a9293f34f00aa062a115c423c1e371b04 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_18.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_18_t.png b/results/func_by_param_init_method/tinyllama/5/comb_18_t.png new file mode 100644 index 0000000000000000000000000000000000000000..382b47548d73c5212c99c75626cdbc176a82c693 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_18_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_1_t.png b/results/func_by_param_init_method/tinyllama/5/comb_1_t.png new file mode 100644 index 0000000000000000000000000000000000000000..c33951805b105a6451e95c2980e13bf4b5c2d0a1 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_1_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_3.png b/results/func_by_param_init_method/tinyllama/5/comb_3.png new file mode 100644 index 0000000000000000000000000000000000000000..8c4a48988132ccd0182376a193f6ae7a232689b3 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_3.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_3_t.png b/results/func_by_param_init_method/tinyllama/5/comb_3_t.png new file mode 100644 index 0000000000000000000000000000000000000000..aa904b49b156b4343e055ab2fc28dfcdf8c3103f Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_3_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_8.png b/results/func_by_param_init_method/tinyllama/5/comb_8.png new file mode 100644 index 0000000000000000000000000000000000000000..585d6cd8a47b69fd63e68dcaad3a52d9d02890c9 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_8.png differ diff --git a/results/func_by_param_init_method/tinyllama/5/comb_8_t.png b/results/func_by_param_init_method/tinyllama/5/comb_8_t.png new file mode 100644 index 0000000000000000000000000000000000000000..e31a098b6fe4664ffb4bc94594d2524a63142607 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/5/comb_8_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_1.png b/results/func_by_param_init_method/tinyllama/6/comb_1.png new file mode 100644 index 0000000000000000000000000000000000000000..3a6407dcb70d9179a87035f9183dbae904e7c25a Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_1.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_10.png b/results/func_by_param_init_method/tinyllama/6/comb_10.png new file mode 100644 index 0000000000000000000000000000000000000000..5b8c3c56672e2001655ded937aac0031d57a36ce Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_10.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_10_t.png b/results/func_by_param_init_method/tinyllama/6/comb_10_t.png new file mode 100644 index 0000000000000000000000000000000000000000..de18323b8b7a5afccf57c6ecabdae34c30ce6a37 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_10_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_12.png b/results/func_by_param_init_method/tinyllama/6/comb_12.png new file mode 100644 index 0000000000000000000000000000000000000000..a2ef0629c9d8434da0d310a98979d4b85d0638b5 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_12.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_12_t.png b/results/func_by_param_init_method/tinyllama/6/comb_12_t.png new file mode 100644 index 0000000000000000000000000000000000000000..3f1a6a06baa00b62677609332de3735cb3de44ee Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_12_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_15.png b/results/func_by_param_init_method/tinyllama/6/comb_15.png new file mode 100644 index 0000000000000000000000000000000000000000..9515604757e29a732203a902034d0a9a0acc6a97 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_15.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_15_t.png b/results/func_by_param_init_method/tinyllama/6/comb_15_t.png new file mode 100644 index 0000000000000000000000000000000000000000..9248e0d6075763a54a8645a043e4b9bb351cc27c Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_15_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_18.png b/results/func_by_param_init_method/tinyllama/6/comb_18.png new file mode 100644 index 0000000000000000000000000000000000000000..f14ec04cf659542e4fe281f44a4d1004e7f7e104 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_18.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_18_t.png b/results/func_by_param_init_method/tinyllama/6/comb_18_t.png new file mode 100644 index 0000000000000000000000000000000000000000..ef36c1707c8aa916ef665cac78ce8395766e6ec2 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_18_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_1_t.png b/results/func_by_param_init_method/tinyllama/6/comb_1_t.png new file mode 100644 index 0000000000000000000000000000000000000000..977a8d2a911c5dd6b4eb62937dc252b5bdf83d00 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_1_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_3.png b/results/func_by_param_init_method/tinyllama/6/comb_3.png new file mode 100644 index 0000000000000000000000000000000000000000..1820d2b727aa1508c32027c5228a7132da347050 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_3.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_3_t.png b/results/func_by_param_init_method/tinyllama/6/comb_3_t.png new file mode 100644 index 0000000000000000000000000000000000000000..abcdadcb96c977700eb94fba1d0365ddc7a16ed9 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_3_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_8.png b/results/func_by_param_init_method/tinyllama/6/comb_8.png new file mode 100644 index 0000000000000000000000000000000000000000..56d26ae800061fbc2b95704c26c6fecb436685f6 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_8.png differ diff --git a/results/func_by_param_init_method/tinyllama/6/comb_8_t.png b/results/func_by_param_init_method/tinyllama/6/comb_8_t.png new file mode 100644 index 0000000000000000000000000000000000000000..3afd3da16ffaeaa7651975e1b8904555626d3629 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/6/comb_8_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_1.png b/results/func_by_param_init_method/tinyllama/7/comb_1.png new file mode 100644 index 0000000000000000000000000000000000000000..ed5cd0231cdf385924a778a6b5d9134e2b360a3b Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_1.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_10.png b/results/func_by_param_init_method/tinyllama/7/comb_10.png new file mode 100644 index 0000000000000000000000000000000000000000..74ba79950014674b9e8452191b2b18d4e2886d7b Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_10.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_10_t.png b/results/func_by_param_init_method/tinyllama/7/comb_10_t.png new file mode 100644 index 0000000000000000000000000000000000000000..82206c3124f4975bb42a70c2b50887c274c42518 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_10_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_12.png b/results/func_by_param_init_method/tinyllama/7/comb_12.png new file mode 100644 index 0000000000000000000000000000000000000000..eadd2ebbcdd366ffd9c65ecc49e3486c6bb3029e Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_12.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_12_t.png b/results/func_by_param_init_method/tinyllama/7/comb_12_t.png new file mode 100644 index 0000000000000000000000000000000000000000..35dba095a23ce5d586268469ef1d8995c3d052a8 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_12_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_15.png b/results/func_by_param_init_method/tinyllama/7/comb_15.png new file mode 100644 index 0000000000000000000000000000000000000000..6c3f667b13fceb14f91a7ed57ca2d1b720189a36 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_15.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_15_t.png b/results/func_by_param_init_method/tinyllama/7/comb_15_t.png new file mode 100644 index 0000000000000000000000000000000000000000..36b2d8f4c68fd4caba7d3b5227544832b06bb6cc Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_15_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_18.png b/results/func_by_param_init_method/tinyllama/7/comb_18.png new file mode 100644 index 0000000000000000000000000000000000000000..38dbbfc3dc457735b7c8d09c32bb5b5757aa888c Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_18.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_18_t.png b/results/func_by_param_init_method/tinyllama/7/comb_18_t.png new file mode 100644 index 0000000000000000000000000000000000000000..844dbe4ffcceb4cf04f7ebd4bcee7dbdfe6a6449 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_18_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_1_t.png b/results/func_by_param_init_method/tinyllama/7/comb_1_t.png new file mode 100644 index 0000000000000000000000000000000000000000..f62d3de9c9f28c1894c2ff3c6fb062bb63005da2 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_1_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_3.png b/results/func_by_param_init_method/tinyllama/7/comb_3.png new file mode 100644 index 0000000000000000000000000000000000000000..ac00567d37efaea071014e964a99f7c8f627ae6d Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_3.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_3_t.png b/results/func_by_param_init_method/tinyllama/7/comb_3_t.png new file mode 100644 index 0000000000000000000000000000000000000000..bb5163598470059d7bafbbdd9af7adf2b8afd332 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_3_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_8.png b/results/func_by_param_init_method/tinyllama/7/comb_8.png new file mode 100644 index 0000000000000000000000000000000000000000..766e4d372ae4d0d6189758e1c9e1dc0fba13ec44 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_8.png differ diff --git a/results/func_by_param_init_method/tinyllama/7/comb_8_t.png b/results/func_by_param_init_method/tinyllama/7/comb_8_t.png new file mode 100644 index 0000000000000000000000000000000000000000..4ff6fc79d641a50590b7cdea3ac00c5b8308fae7 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/7/comb_8_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_1.png b/results/func_by_param_init_method/tinyllama/8/comb_1.png new file mode 100644 index 0000000000000000000000000000000000000000..9f8ea5760f3d7ab193e6a4b4e4a0a43e70321398 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_1.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_10.png b/results/func_by_param_init_method/tinyllama/8/comb_10.png new file mode 100644 index 0000000000000000000000000000000000000000..f301205f168b1610e12efb5055b56cd099656a60 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_10.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_10_t.png b/results/func_by_param_init_method/tinyllama/8/comb_10_t.png new file mode 100644 index 0000000000000000000000000000000000000000..5e2e0388e7512aa51d88c353382373ef44f348dc Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_10_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_12.png b/results/func_by_param_init_method/tinyllama/8/comb_12.png new file mode 100644 index 0000000000000000000000000000000000000000..efc5a2ad8e22d41b7c2b7f16f3e193732d866891 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_12.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_12_t.png b/results/func_by_param_init_method/tinyllama/8/comb_12_t.png new file mode 100644 index 0000000000000000000000000000000000000000..bfa34b9c1e192f0cee6de7c2a4d2aeb1126f18ba Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_12_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_15.png b/results/func_by_param_init_method/tinyllama/8/comb_15.png new file mode 100644 index 0000000000000000000000000000000000000000..ac01ab432724b1a56464fd8bbe8b3a68bf18f3fc Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_15.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_15_t.png b/results/func_by_param_init_method/tinyllama/8/comb_15_t.png new file mode 100644 index 0000000000000000000000000000000000000000..4b75f9026e94c227e2c2e5c053eba207eb461bc2 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_15_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_18.png b/results/func_by_param_init_method/tinyllama/8/comb_18.png new file mode 100644 index 0000000000000000000000000000000000000000..893f82963551c82a1da03d0c5701d6b0c6b66bda Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_18.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_18_t.png b/results/func_by_param_init_method/tinyllama/8/comb_18_t.png new file mode 100644 index 0000000000000000000000000000000000000000..1f0d5d70bbd3873b003e017a8542e2de4af41635 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_18_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_1_t.png b/results/func_by_param_init_method/tinyllama/8/comb_1_t.png new file mode 100644 index 0000000000000000000000000000000000000000..594ccd6ff253373af6a2b5d6861741c87ef054de Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_1_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_3.png b/results/func_by_param_init_method/tinyllama/8/comb_3.png new file mode 100644 index 0000000000000000000000000000000000000000..eaca7143baac8839b096e3c3b0aadb38650bdcc1 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_3.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_3_t.png b/results/func_by_param_init_method/tinyllama/8/comb_3_t.png new file mode 100644 index 0000000000000000000000000000000000000000..26a7330ec4e590053e9742308a998a98f6e2e65c Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_3_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_4_t.png b/results/func_by_param_init_method/tinyllama/8/comb_4_t.png new file mode 100644 index 0000000000000000000000000000000000000000..8abc728b4849b644eea180378ccf10c169d669b7 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_4_t.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_8.png b/results/func_by_param_init_method/tinyllama/8/comb_8.png new file mode 100644 index 0000000000000000000000000000000000000000..e398257af9634d8a0e175fc0198b29664896629b Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_8.png differ diff --git a/results/func_by_param_init_method/tinyllama/8/comb_8_t.png b/results/func_by_param_init_method/tinyllama/8/comb_8_t.png new file mode 100644 index 0000000000000000000000000000000000000000..59052884dad882984cb27a396c8fdf66729c3217 Binary files /dev/null and b/results/func_by_param_init_method/tinyllama/8/comb_8_t.png differ diff --git a/results/results.txt b/results/results.txt new file mode 100644 index 0000000000000000000000000000000000000000..01a0a3f8cf61d433f60bfa6a20ffd4dbce9203b8 --- /dev/null +++ b/results/results.txt @@ -0,0 +1,102 @@ +| | accuracy | bits | clip | dataset | method | model | params | peak_mem_alloc_mb | peak_mem_reserv_mb | perplexity | time_ms | wer | +|---:|-----------:|-------:|-------:|:----------|:----------|:----------|:----------|--------------------:|---------------------:|-------------:|----------:|------:| +| 0 | 0.364167 | 4 | 0 | wikitext | ao_woq | tinyllama | fixed | 741.693 | 866.124 | 7.04309 | 18.6202 | 0 | +| 1 | 0.377136 | 8 | 0 | wikitext | ao_woq | tinyllama | fixed | 1631.73 | 1988.1 | 6.60597 | 15.5631 | 0 | +| 2 | 0 | 4 | 0 | wikitext | comb_4 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.11067 | 19.426 | 0 | +| 3 | 0 | 5 | 0 | wikitext | comb_4 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.11067 | 19.426 | 0 | +| 4 | 0 | 6 | 0 | wikitext | comb_4 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.11067 | 19.426 | 0 | +| 5 | 0 | 7 | 0 | wikitext | comb_4 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.11067 | 19.426 | 0 | +| 6 | 0 | 8 | 0 | wikitext | comb_4 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.11067 | 19.426 | 0 | +| 7 | 0 | 4 | 0 | wikitext | comb_7 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.10931 | 25.8038 | 0 | +| 8 | 0 | 5 | 0 | wikitext | comb_7 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.10931 | 25.8038 | 0 | +| 9 | 0 | 6 | 0 | wikitext | comb_7 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.10931 | 25.8038 | 0 | +| 10 | 0 | 7 | 0 | wikitext | comb_7 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.10931 | 25.8038 | 0 | +| 11 | 0 | 8 | 0 | wikitext | comb_7 | tinyllama | nlr_t_lin | 1895.56 | 2157.97 | 1.10931 | 25.8038 | 0 | +| 12 | 0.374401 | 7 | 0 | wikitext | comb_15 | tinyllama | nlr_t_lin | 1896.03 | 2157.97 | 6.75553 | 14.6879 | 0 | +| 13 | 0.339919 | 4 | 0 | wikitext | comb_15 | tinyllama | nlr_t_lin | 1896.03 | 2157.97 | 7.79865 | 15.1396 | 0 | +| 14 | 0.364674 | 5 | 0 | wikitext | comb_15 | tinyllama | nlr_t_lin | 1896.03 | 2157.97 | 7.0995 | 15.1885 | 0 | +| 15 | 0.377001 | 8 | 0 | wikitext | comb_15 | tinyllama | nlr_t_lin | 1896.03 | 2157.97 | 6.66112 | 15.2789 | 0 | +| 16 | 0.377676 | 6 | 0 | wikitext | comb_15 | tinyllama | nlr_t_lin | 1896.03 | 2157.97 | 6.69979 | 15.6516 | 0 | +| 17 | 0.376326 | 7 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.66335 | 16.0967 | 0 | +| 18 | 0.367612 | 5 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.9663 | 16.1348 | 0 | +| 19 | 0.377271 | 8 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.60481 | 16.2726 | 0 | +| 20 | 0.378588 | 6 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.50158 | 16.2963 | 0 | +| 21 | 0.346977 | 4 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 7.65536 | 16.4195 | 0 | +| 22 | 0 | 4 | 0 | wikitext | comb_1 | tinyllama | nlr_t_lin | 1897.39 | 2160.07 | 1.11627 | 27.0637 | 0 | +| 23 | 0 | 5 | 0 | wikitext | comb_1 | tinyllama | nlr_t_lin | 1897.39 | 2160.07 | 1.11627 | 27.0637 | 0 | +| 24 | 0.00793651 | 7 | 0 | wikitext | comb_1 | tinyllama | nlr_t_lin | 1897.39 | 2160.07 | 1.10892 | 27.1898 | 0 | +| 25 | 0.0142857 | 6 | 0 | wikitext | comb_1 | tinyllama | nlr_t_lin | 1897.39 | 2160.07 | 1.13242 | 27.219 | 0 | +| 26 | 0.374367 | 7 | 0 | wikitext | comb_18 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.74798 | 27.402 | 0 | +| 27 | 0.376461 | 6 | 0 | wikitext | comb_8 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.67411 | 27.4023 | 0 | +| 28 | 0.339446 | 4 | 0 | wikitext | comb_18 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.92421 | 27.4152 | 0 | +| 29 | 0.366937 | 5 | 0 | wikitext | comb_8 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.094 | 27.4249 | 0 | +| 30 | 0.366093 | 5 | 0 | wikitext | comb_18 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.09658 | 27.4379 | 0 | +| 31 | 0.37663 | 8 | 0 | wikitext | comb_10 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.64583 | 27.4412 | 0 | +| 32 | 0.378859 | 6 | 0 | wikitext | comb_12 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.68694 | 27.4473 | 0 | +| 33 | 0.36768 | 5 | 0 | wikitext | comb_10 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.07761 | 27.4505 | 0 | +| 34 | 0.375076 | 7 | 0 | wikitext | comb_8 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.72959 | 27.4528 | 0 | +| 35 | 0.377204 | 7 | 0 | wikitext | comb_12 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.73715 | 27.4543 | 0 | +| 36 | 0.167747 | 4 | 0 | wikitext | comb_10 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 20.6911 | 27.457 | 0 | +| 37 | 0.340865 | 4 | 0 | wikitext | comb_12 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.79761 | 27.4818 | 0 | +| 38 | 0.376157 | 8 | 0 | wikitext | comb_12 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.65289 | 27.4832 | 0 | +| 39 | 0.367815 | 5 | 0 | wikitext | comb_12 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.09679 | 27.4854 | 0 | +| 40 | 0.254272 | 8 | 0 | wikitext | comb_1 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 10.9745 | 27.4979 | 0 | +| 41 | 0.377406 | 7 | 0 | wikitext | comb_10 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.70391 | 27.4991 | 0 | +| 42 | 0.37744 | 6 | 0 | wikitext | comb_18 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.72135 | 27.5086 | 0 | +| 43 | 0.374603 | 8 | 0 | wikitext | comb_8 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.66512 | 27.5226 | 0 | +| 44 | 0.378251 | 6 | 0 | wikitext | comb_10 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.68017 | 27.5287 | 0 | +| 45 | 0.37619 | 8 | 0 | wikitext | comb_18 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.64042 | 27.5292 | 0 | +| 46 | 0.341202 | 4 | 0 | wikitext | comb_8 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.81138 | 27.5381 | 0 | +| 47 | 0.377643 | 6 | 0 | wikitext | comb_3 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.70463 | 34.6445 | 0 | +| 48 | 0.365417 | 5 | 0 | wikitext | comb_3 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.11331 | 34.654 | 0 | +| 49 | 0.337589 | 4 | 0 | wikitext | comb_3 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 7.91026 | 34.6757 | 0 | +| 50 | 0.374637 | 7 | 0 | wikitext | comb_3 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.74299 | 34.6918 | 0 | +| 51 | 0.376731 | 8 | 0 | wikitext | comb_3 | tinyllama | nlr_t_lin | 1897.87 | 2160.07 | 6.63074 | 34.7201 | 0 | +| 52 | 0 | 8 | 0 | wikitext | comb_7_t | tinyllama | nlr_t_lin | 1904.15 | 2174.75 | 1.10931 | 25.9245 | 0 | +| 53 | 0.0206349 | 8 | 0 | wikitext | comb_4_t | tinyllama | nlr_t_lin | 1904.08 | 2178.94 | 1.10702 | 19.5499 | 0 | +| 54 | 0.469166 | 7 | 0 | wikitext | comb_15_t | tinyllama | nlr_t_lin | 1904.55 | 2178.94 | 3.58678 | 15.0422 | 0 | +| 55 | 0.472172 | 6 | 0 | wikitext | comb_15_t | tinyllama | nlr_t_lin | 1904.55 | 2178.94 | 3.74549 | 15.1353 | 0 | +| 56 | 0.407329 | 4 | 0 | wikitext | comb_15_t | tinyllama | nlr_t_lin | 1904.55 | 2178.94 | 5.5389 | 15.1466 | 0 | +| 57 | 0.458798 | 5 | 0 | wikitext | comb_15_t | tinyllama | nlr_t_lin | 1904.55 | 2178.94 | 4.27372 | 15.1627 | 0 | +| 58 | 0.447855 | 8 | 0 | wikitext | comb_15_t | tinyllama | nlr_t_lin | 1904.55 | 2178.94 | 3.98991 | 15.2559 | 0 | +| 59 | 0.471631 | 7 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 3.6279 | 15.4474 | 0 | +| 60 | 0.394765 | 4 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 5.69315 | 16.1556 | 0 | +| 61 | 0.453191 | 5 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 4.35177 | 16.2126 | 0 | +| 62 | 0.451807 | 8 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 3.85918 | 16.2477 | 0 | +| 63 | 0.466734 | 6 | 0 | wikitext | woq_t | tinyllama | fixed | 1904.63 | 2181.04 | 3.77661 | 16.6132 | 0 | +| 64 | 0.462648 | 6 | 0 | wikitext | comb_8_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.88226 | 27.3918 | 0 | +| 65 | 0.125464 | 8 | 0 | wikitext | comb_1_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 23.4259 | 27.3924 | 0 | +| 66 | 0.134313 | 6 | 0 | wikitext | comb_1_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 23.099 | 27.3987 | 0 | +| 67 | 0.467275 | 6 | 0 | wikitext | comb_18_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.75391 | 27.4106 | 0 | +| 68 | 0.471192 | 6 | 0 | wikitext | comb_10_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.71062 | 27.4119 | 0 | +| 69 | 0.408342 | 4 | 0 | wikitext | comb_10_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 5.67788 | 27.4169 | 0 | +| 70 | 0.456265 | 5 | 0 | wikitext | comb_8_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 4.39524 | 27.4248 | 0 | +| 71 | 0.406349 | 4 | 0 | wikitext | comb_12_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 5.51247 | 27.4318 | 0 | +| 72 | 0.412327 | 4 | 0 | wikitext | comb_18_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 5.47103 | 27.4325 | 0 | +| 73 | 0.130091 | 7 | 0 | wikitext | comb_1_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 22.3522 | 27.4447 | 0 | +| 74 | 0.409524 | 4 | 0 | wikitext | comb_8_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 5.58988 | 27.4488 | 0 | +| 75 | 0.469031 | 7 | 0 | wikitext | comb_10_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.71809 | 27.4698 | 0 | +| 76 | 0.465417 | 7 | 0 | wikitext | comb_8_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.70439 | 27.4699 | 0 | +| 77 | 0.124451 | 5 | 0 | wikitext | comb_1_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 23.3708 | 27.471 | 0 | +| 78 | 0.445998 | 8 | 0 | wikitext | comb_10_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 4.00356 | 27.4997 | 0 | +| 79 | 0.465012 | 6 | 0 | wikitext | comb_12_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.78182 | 27.5231 | 0 | +| 80 | 0.468896 | 7 | 0 | wikitext | comb_12_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.71093 | 27.5321 | 0 | +| 81 | 0.444107 | 8 | 0 | wikitext | comb_12_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.90921 | 27.539 | 0 | +| 82 | 0.457683 | 5 | 0 | wikitext | comb_12_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 4.17521 | 27.5444 | 0 | +| 83 | 0.448159 | 8 | 0 | wikitext | comb_8_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.94272 | 27.5528 | 0 | +| 84 | 0.471462 | 7 | 0 | wikitext | comb_18_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.60005 | 27.5591 | 0 | +| 85 | 0.455792 | 5 | 0 | wikitext | comb_18_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 4.27851 | 27.6055 | 0 | +| 86 | 0.446538 | 8 | 0 | wikitext | comb_18_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.86366 | 27.6106 | 0 | +| 87 | 0.456062 | 5 | 0 | wikitext | comb_10_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 4.23743 | 27.63 | 0 | +| 88 | 0.456501 | 5 | 0 | wikitext | comb_3_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 4.17788 | 34.5879 | 0 | +| 89 | 0.4692 | 6 | 0 | wikitext | comb_3_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.85147 | 34.651 | 0 | +| 90 | 0.452482 | 8 | 0 | wikitext | comb_3_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.8513 | 34.6798 | 0 | +| 91 | 0.470652 | 7 | 0 | wikitext | comb_3_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 3.62595 | 34.6993 | 0 | +| 92 | 0.408274 | 4 | 0 | wikitext | comb_3_t | tinyllama | nlr_t_lin | 1906.38 | 2181.04 | 5.55848 | 34.7729 | 0 | +| 93 | 0 | 4 | 0 | wikitext | comb_11 | tinyllama | nlr_t_lin | 1381.17 | 2487.22 | 1.12504 | 0.501952 | 0 | +| 94 | 0 | 5 | 0 | wikitext | comb_11 | tinyllama | nlr_t_lin | 1381.17 | 2487.22 | 1.12504 | 0.501952 | 0 | +| 95 | 0 | 6 | 0 | wikitext | comb_11 | tinyllama | nlr_t_lin | 1381.17 | 2487.22 | 1.12504 | 0.501952 | 0 | +| 96 | 0 | 7 | 0 | wikitext | comb_11 | tinyllama | nlr_t_lin | 1381.17 | 2487.22 | 1.12504 | 0.501952 | 0 | +| 97 | 0 | 8 | 0 | wikitext | comb_11 | tinyllama | nlr_t_lin | 1381.17 | 2487.22 | 1.12504 | 0.501952 | 0 | +| 98 | 0 | 8 | 0 | wikitext | comb_11_t | tinyllama | nlr_t_lin | 1389.69 | 2499.81 | 1.10787 | 0.506853 | 0 | +| 99 | 0.378149 | 32 | 0 | wikitext | base | tinyllama | ---- | 4470.55 | 4485.81 | 6.59595 | 11.7914 | 0 | \ No newline at end of file