| | accuracy | bits | clip | dataset | method | model | params | peak_mem_alloc_mb | peak_mem_reserv_mb | perplexity | time_ms | wer | |---:|-----------:|-------:|-------:|:----------|:---------|:--------|:---------|--------------------:|---------------------:|-------------:|----------:|------:| | 0 | 0.427795 | 4 | 0 | wikitext | ao_woq | llama3 | fixed | 5542.36 | 7163.87 | 5.35836 | 39.207 | 0 | | 1 | 0.443735 | 8 | 0 | wikitext | ao_woq | llama3 | fixed | 12110.4 | 14040.4 | 5.20864 | 52.5034 | 0 | | 2 | 0 | 4 | 0 | wikitext | comb_1 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.35769 | 122.248 | 0 | | 3 | 0 | 5 | 0 | wikitext | comb_1 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.35769 | 122.248 | 0 | | 4 | 0 | 6 | 0 | wikitext | comb_1 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.35769 | 122.248 | 0 | | 5 | 0 | 7 | 0 | wikitext | comb_1 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.35769 | 122.248 | 0 | | 6 | 0 | 8 | 0 | wikitext | comb_1 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.35769 | 122.248 | 0 | | 7 | 0 | 4 | 0 | wikitext | comb_9 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.12481 | 146.192 | 0 | | 8 | 0 | 5 | 0 | wikitext | comb_9 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.12481 | 146.192 | 0 | | 9 | 0 | 6 | 0 | wikitext | comb_9 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.12481 | 146.192 | 0 | | 10 | 0 | 7 | 0 | wikitext | comb_9 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.12481 | 146.192 | 0 | | 11 | 0 | 8 | 0 | wikitext | comb_9 | llama3 | norm_nlr | 14178.7 | 15367.9 | 1.12481 | 146.192 | 0 | | 12 | 0.380108 | 4 | 0 | wikitext | comb_5 | llama3 | norm_nlr | 14179.2 | 15367.9 | 6.15098 | 68.7494 | 0 | | 13 | 0.442857 | 7 | 0 | wikitext | comb_5 | llama3 | norm_nlr | 14179.2 | 15367.9 | 5.24819 | 68.9355 | 0 | | 14 | 0.443735 | 8 | 0 | wikitext | comb_5 | llama3 | norm_nlr | 14179.2 | 15367.9 | 5.20864 | 68.9602 | 0 | | 15 | 0.435664 | 5 | 0 | wikitext | comb_5 | llama3 | norm_nlr | 14179.2 | 15367.9 | 5.44902 | 68.9898 | 0 | | 16 | 0.440493 | 6 | 0 | wikitext | comb_5 | llama3 | norm_nlr | 14179.2 | 15367.9 | 5.19914 | 69.026 | 0 | | 17 | 0.442756 | 7 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 5.24889 | 95.8167 | 0 | | 18 | 0.435562 | 5 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 5.44896 | 95.8369 | 0 | | 19 | 0.440932 | 6 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 5.1933 | 95.8431 | 0 | | 20 | 0.44387 | 8 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 5.20824 | 95.8455 | 0 | | 21 | 0.37977 | 4 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 6.16325 | 95.8769 | 0 | | 22 | 0 | 4 | 0 | wikitext | comb_2 | llama3 | norm_nlr | 14185.3 | 15374.2 | 1.14597 | 202.198 | 0 | | 23 | 0 | 5 | 0 | wikitext | comb_2 | llama3 | norm_nlr | 14185.3 | 15374.2 | 1.14597 | 202.198 | 0 | | 24 | 0 | 6 | 0 | wikitext | comb_2 | llama3 | norm_nlr | 14185.3 | 15374.2 | 1.14597 | 202.198 | 0 | | 25 | 0 | 7 | 0 | wikitext | comb_2 | llama3 | norm_nlr | 14185.3 | 15374.2 | 1.14597 | 202.198 | 0 | | 26 | 0.442891 | 7 | 0 | wikitext | comb_18 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.23025 | 147.947 | 0 | | 27 | 0.440088 | 6 | 0 | wikitext | comb_11 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.19924 | 147.956 | 0 | | 28 | 0.442215 | 7 | 0 | wikitext | comb_11 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.24756 | 147.968 | 0 | | 29 | 0.437386 | 5 | 0 | wikitext | comb_18 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.41202 | 148.009 | 0 | | 30 | 0.380986 | 4 | 0 | wikitext | comb_11 | llama3 | norm_nlr | 14185.7 | 15374.2 | 6.23264 | 148.085 | 0 | | 31 | 0.440257 | 6 | 0 | wikitext | comb_18 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.23001 | 148.119 | 0 | | 32 | 0.443904 | 8 | 0 | wikitext | comb_11 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.20745 | 148.164 | 0 | | 33 | 0.378386 | 4 | 0 | wikitext | comb_18 | llama3 | norm_nlr | 14185.7 | 15374.2 | 6.16797 | 148.355 | 0 | | 34 | 0.436508 | 5 | 0 | wikitext | comb_11 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.43094 | 148.379 | 0 | | 35 | 0.444377 | 8 | 0 | wikitext | comb_18 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.20728 | 148.395 | 0 | | 36 | 0.436373 | 5 | 0 | wikitext | comb_6 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.3921 | 175.279 | 0 | | 37 | 0.378419 | 4 | 0 | wikitext | comb_6 | llama3 | norm_nlr | 14185.7 | 15374.2 | 6.15577 | 175.288 | 0 | | 38 | 0.443533 | 7 | 0 | wikitext | comb_6 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.22837 | 175.343 | 0 | | 39 | 0.444107 | 8 | 0 | wikitext | comb_6 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.21485 | 175.53 | 0 | | 40 | 0.440696 | 6 | 0 | wikitext | comb_6 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.23038 | 175.603 | 0 | | 41 | 0.440257 | 6 | 0 | wikitext | comb_15 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.23111 | 201.24 | 0 | | 42 | 0.442891 | 7 | 0 | wikitext | comb_15 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.22931 | 201.289 | 0 | | 43 | 0.378116 | 4 | 0 | wikitext | comb_15 | llama3 | norm_nlr | 14185.7 | 15374.2 | 6.17802 | 201.489 | 0 | | 44 | 0.444411 | 8 | 0 | wikitext | comb_15 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.208 | 201.509 | 0 | | 45 | 0.301655 | 8 | 0 | wikitext | comb_2 | llama3 | norm_nlr | 14185.7 | 15374.2 | 8.71646 | 201.86 | 0 | | 46 | 0.436879 | 5 | 0 | wikitext | comb_15 | llama3 | norm_nlr | 14185.7 | 15374.2 | 5.4106 | 201.891 | 0 | | 47 | 0 | 4 | 0 | wikitext | comb_12 | llama3 | norm_nlr | 14191.8 | 15378.4 | 1.58254 | 187.261 | 0 | | 48 | 0 | 4 | 0 | wikitext | comb_3 | llama3 | norm_nlr | 14191.8 | 15378.4 | 1.23333 | 187.283 | 0 | | 49 | 0 | 4 | 0 | wikitext | comb_16 | llama3 | norm_nlr | 14191.8 | 15378.4 | 1.80209 | 187.796 | 0 | | 50 | 0 | 4 | 0 | wikitext | comb_13 | llama3 | norm_nlr | 14191.8 | 15378.4 | 10.0525 | 187.802 | 0 | | 51 | 0 | 5 | 0 | wikitext | comb_13 | llama3 | norm_nlr | 14191.8 | 15378.4 | 10.0525 | 187.802 | 0 | | 52 | 0 | 6 | 0 | wikitext | comb_13 | llama3 | norm_nlr | 14191.8 | 15378.4 | 10.0525 | 187.802 | 0 | | 53 | 0.0355418 | 5 | 0 | wikitext | comb_3 | llama3 | norm_nlr | 14191.8 | 15378.4 | 1.5306 | 187.828 | 0 | | 54 | 0.443803 | 8 | 0 | wikitext | comb_16 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.16194 | 187.461 | 0 | | 55 | 0.430834 | 7 | 0 | wikitext | comb_3 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.30749 | 187.539 | 0 | | 56 | 0.441405 | 7 | 0 | wikitext | comb_16 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.24326 | 187.599 | 0 | | 57 | 0.424282 | 6 | 0 | wikitext | comb_12 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.48562 | 187.613 | 0 | | 58 | 0.288146 | 5 | 0 | wikitext | comb_16 | llama3 | norm_nlr | 14192.3 | 15380.5 | 8.61832 | 187.657 | 0 | | 59 | 0.403377 | 5 | 0 | wikitext | comb_17 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.51409 | 187.721 | 0 | | 60 | 0.413779 | 6 | 0 | wikitext | comb_16 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.61277 | 187.751 | 0 | | 61 | 0.227423 | 7 | 0 | wikitext | comb_13 | llama3 | norm_nlr | 14192.3 | 15380.5 | 12.6204 | 187.771 | 0 | | 62 | 0.441979 | 8 | 0 | wikitext | comb_3 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.21832 | 187.808 | 0 | | 63 | 0.42256 | 8 | 0 | wikitext | comb_13 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.22474 | 187.865 | 0 | | 64 | 0.441979 | 8 | 0 | wikitext | comb_12 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.23714 | 187.946 | 0 | | 65 | 0.365924 | 6 | 0 | wikitext | comb_3 | llama3 | norm_nlr | 14192.3 | 15380.5 | 6.60476 | 187.95 | 0 | | 66 | 0.441743 | 7 | 0 | wikitext | comb_17 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.25572 | 187.956 | 0 | | 67 | 0.220027 | 5 | 0 | wikitext | comb_12 | llama3 | norm_nlr | 14192.3 | 15380.5 | 12.0249 | 188.009 | 0 | | 68 | 0.440426 | 7 | 0 | wikitext | comb_12 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.2084 | 188.032 | 0 | | 69 | 0.224485 | 4 | 0 | wikitext | comb_17 | llama3 | norm_nlr | 14192.3 | 15380.5 | 11.9652 | 188.046 | 0 | | 70 | 0.444107 | 8 | 0 | wikitext | comb_17 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.21989 | 188.102 | 0 | | 71 | 0.439818 | 6 | 0 | wikitext | comb_17 | llama3 | norm_nlr | 14192.3 | 15380.5 | 5.20365 | 188.222 | 0 | | 72 | 0 | 4 | 0 | wikitext | comb_4 | llama3 | norm_nlr | 16812 | 19811.8 | 1.12481 | 426.526 | 0 | | 73 | 0 | 5 | 0 | wikitext | comb_4 | llama3 | norm_nlr | 16812 | 19811.8 | 1.12481 | 426.526 | 0 | | 74 | 0 | 6 | 0 | wikitext | comb_4 | llama3 | norm_nlr | 16812 | 19811.8 | 1.12481 | 426.526 | 0 | | 75 | 0 | 7 | 0 | wikitext | comb_4 | llama3 | norm_nlr | 16812 | 19811.8 | 1.12481 | 426.526 | 0 | | 76 | 0 | 8 | 0 | wikitext | comb_4 | llama3 | norm_nlr | 16812 | 19811.8 | 1.12481 | 426.526 | 0 | | 77 | 0 | 4 | 0 | wikitext | comb_10 | llama3 | norm_nlr | 11058 | 21091.1 | 1.18446 | 4.43101 | 0 | | 78 | 0 | 5 | 0 | wikitext | comb_10 | llama3 | norm_nlr | 11058 | 21091.1 | 1.18446 | 4.43101 | 0 | | 79 | 0.443668 | 32 | 0 | wikitext | base | llama3 | ---- | 33003.5 | 33156 | 5.22381 | 26.8009 | 0 | | 80 | 0.443634 | 8 | 0 | wikitext | comb_10 | llama3 | norm_nlr | 58810.6 | 68843.2 | 5.21296 | 4.40037 | 0 | | 81 | 0.386998 | 6 | 0 | wikitext | comb_10 | llama3 | norm_nlr | 58810.6 | 68843.2 | 5.64073 | 4.42918 | 0 | | 82 | 0.43178 | 7 | 0 | wikitext | comb_10 | llama3 | norm_nlr | 58810.6 | 68843.2 | 5.31969 | 4.43837 | 0 |