Diogo-V commited on
Commit
bb55dd8
1 Parent(s): 595a94c

Adds final graphs

Browse files
Files changed (47) hide show
  1. results/best_param_per_func_with_baselines/tinyllama/4/best_param_per_func_with_baselines.png +0 -0
  2. results/best_param_per_func_with_baselines/tinyllama/5/best_param_per_func_with_baselines.png +0 -0
  3. results/best_param_per_func_with_baselines/tinyllama/6/best_param_per_func_with_baselines.png +0 -0
  4. results/best_param_per_func_with_baselines/tinyllama/7/best_param_per_func_with_baselines.png +0 -0
  5. results/best_param_per_func_with_baselines/tinyllama/8/best_param_per_func_with_baselines.png +0 -0
  6. results/bitwidth_acc_decay_per_function/tinyllama.png +0 -0
  7. results/df.tsv +84 -0
  8. results/func_by_param_init_method/tinyllama/4/comb_14.png +0 -0
  9. results/func_by_param_init_method/tinyllama/4/comb_16.png +0 -0
  10. results/func_by_param_init_method/tinyllama/4/comb_17.png +0 -0
  11. results/func_by_param_init_method/tinyllama/4/comb_2.png +0 -0
  12. results/func_by_param_init_method/tinyllama/4/comb_3.png +0 -0
  13. results/func_by_param_init_method/tinyllama/4/comb_7.png +0 -0
  14. results/func_by_param_init_method/tinyllama/4/comb_8.png +0 -0
  15. results/func_by_param_init_method/tinyllama/5/comb_14.png +0 -0
  16. results/func_by_param_init_method/tinyllama/5/comb_16.png +0 -0
  17. results/func_by_param_init_method/tinyllama/5/comb_17.png +0 -0
  18. results/func_by_param_init_method/tinyllama/5/comb_2.png +0 -0
  19. results/func_by_param_init_method/tinyllama/5/comb_3.png +0 -0
  20. results/func_by_param_init_method/tinyllama/5/comb_7.png +0 -0
  21. results/func_by_param_init_method/tinyllama/5/comb_8.png +0 -0
  22. results/func_by_param_init_method/tinyllama/6/comb_14.png +0 -0
  23. results/func_by_param_init_method/tinyllama/6/comb_16.png +0 -0
  24. results/func_by_param_init_method/tinyllama/6/comb_17.png +0 -0
  25. results/func_by_param_init_method/tinyllama/6/comb_2.png +0 -0
  26. results/func_by_param_init_method/tinyllama/6/comb_3.png +0 -0
  27. results/func_by_param_init_method/tinyllama/6/comb_7.png +0 -0
  28. results/func_by_param_init_method/tinyllama/6/comb_8.png +0 -0
  29. results/func_by_param_init_method/tinyllama/7/comb_10.png +0 -0
  30. results/func_by_param_init_method/tinyllama/7/comb_14.png +0 -0
  31. results/func_by_param_init_method/tinyllama/7/comb_16.png +0 -0
  32. results/func_by_param_init_method/tinyllama/7/comb_17.png +0 -0
  33. results/func_by_param_init_method/tinyllama/7/comb_18.png +0 -0
  34. results/func_by_param_init_method/tinyllama/7/comb_2.png +0 -0
  35. results/func_by_param_init_method/tinyllama/7/comb_3.png +0 -0
  36. results/func_by_param_init_method/tinyllama/7/comb_7.png +0 -0
  37. results/func_by_param_init_method/tinyllama/7/comb_8.png +0 -0
  38. results/func_by_param_init_method/tinyllama/8/comb_10.png +0 -0
  39. results/func_by_param_init_method/tinyllama/8/comb_14.png +0 -0
  40. results/func_by_param_init_method/tinyllama/8/comb_16.png +0 -0
  41. results/func_by_param_init_method/tinyllama/8/comb_17.png +0 -0
  42. results/func_by_param_init_method/tinyllama/8/comb_18.png +0 -0
  43. results/func_by_param_init_method/tinyllama/8/comb_2.png +0 -0
  44. results/func_by_param_init_method/tinyllama/8/comb_3.png +0 -0
  45. results/func_by_param_init_method/tinyllama/8/comb_7.png +0 -0
  46. results/func_by_param_init_method/tinyllama/8/comb_8.png +0 -0
  47. results/results.txt +85 -0
results/best_param_per_func_with_baselines/tinyllama/4/best_param_per_func_with_baselines.png ADDED
results/best_param_per_func_with_baselines/tinyllama/5/best_param_per_func_with_baselines.png ADDED
results/best_param_per_func_with_baselines/tinyllama/6/best_param_per_func_with_baselines.png ADDED
results/best_param_per_func_with_baselines/tinyllama/7/best_param_per_func_with_baselines.png ADDED
results/best_param_per_func_with_baselines/tinyllama/8/best_param_per_func_with_baselines.png ADDED
results/bitwidth_acc_decay_per_function/tinyllama.png ADDED
results/df.tsv ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accuracy bits clip dataset method model params peak_mem_alloc_mb peak_mem_reserv_mb perplexity time_ms wer
2
+ 0.3641674816608429 4 0.0 wikitext ao_woq tinyllama fixed 741.692928 866.123776 7.043089866638184 18.556989 0.0
3
+ 0.37713611125946045 8 0.0 wikitext ao_woq tinyllama fixed 1631.725568 1988.100096 6.605966091156006 15.390611 0.0
4
+ 0.0 4 0.0 wikitext comb_5 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.110665202140808 19.433262 0.0
5
+ 0.0 5 0.0 wikitext comb_5 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.110665202140808 19.433262 0.0
6
+ 0.0 6 0.0 wikitext comb_5 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.110665202140808 19.433262 0.0
7
+ 0.0 7 0.0 wikitext comb_5 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.110665202140808 19.433262 0.0
8
+ 0.0 8 0.0 wikitext comb_5 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.110665202140808 19.433262 0.0
9
+ 0.0 4 0.0 wikitext comb_11 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.109306812286377 25.945974 0.0
10
+ 0.0 5 0.0 wikitext comb_11 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.109306812286377 25.945974 0.0
11
+ 0.0 6 0.0 wikitext comb_11 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.109306812286377 25.945974 0.0
12
+ 0.0 7 0.0 wikitext comb_11 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.109306812286377 25.945974 0.0
13
+ 0.0 8 0.0 wikitext comb_11 tinyllama nlr_t_no_sched 1895.561216 2157.969408 1.109306812286377 25.945974 0.0
14
+ 0.37274572253227234 6 0.0 wikitext comb_8 tinyllama nlr_t_no_sched 1896.032256 2157.969408 6.825120449066162 14.822067 0.0
15
+ 0.3467409610748291 5 0.0 wikitext comb_8 tinyllama nlr_t_no_sched 1896.032256 2157.969408 7.698853969573975 15.044339 0.0
16
+ 0.37706854939460754 8 0.0 wikitext comb_8 tinyllama nlr_t_no_sched 1896.032256 2157.969408 6.6527509689331055 15.050894 0.0
17
+ 0.30101317167282104 4 0.0 wikitext comb_8 tinyllama nlr_t_no_sched 1896.032256 2157.969408 9.370594024658203 15.30351 0.0
18
+ 0.37406280636787415 7 0.0 wikitext comb_8 tinyllama nlr_t_no_sched 1896.032256 2157.969408 6.726755142211914 15.732151 0.0
19
+ 0.3676123023033142 5 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.966304302215576 16.130207 0.0
20
+ 0.3763255476951599 7 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.663349628448486 16.142134 0.0
21
+ 0.37727120518684387 8 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.604811191558838 16.250135 0.0
22
+ 0.3469773828983307 4 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 7.655362606048584 16.405294 0.0
23
+ 0.37858834862709045 6 0.0 wikitext woq tinyllama fixed 1896.111616 2160.06656 6.501583099365234 16.922372 0.0
24
+ 0.02380952797830105 7 0.0 wikitext comb_18 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1020679473876953 27.30117 0.0
25
+ 0.0 4 0.0 wikitext comb_18 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1322431564331055 27.319544 0.0
26
+ 0.0 5 0.0 wikitext comb_18 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1322431564331055 27.319544 0.0
27
+ 0.0 6 0.0 wikitext comb_18 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1322431564331055 27.319544 0.0
28
+ 0.0 4 0.0 wikitext comb_0 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.117425560951233 27.367375 0.0
29
+ 0.0 5 0.0 wikitext comb_0 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.117425560951233 27.367375 0.0
30
+ 0.0 6 0.0 wikitext comb_0 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.117425560951233 27.367375 0.0
31
+ 0.0 7 0.0 wikitext comb_0 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.117425560951233 27.367375 0.0
32
+ 0.0 8 0.0 wikitext comb_0 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.117425560951233 27.367375 0.0
33
+ 0.0 4 0.0 wikitext comb_10 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.12163245677948 40.600346 0.0
34
+ 0.0 5 0.0 wikitext comb_10 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.12163245677948 40.600346 0.0
35
+ 0.0 6 0.0 wikitext comb_10 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.12163245677948 40.600346 0.0
36
+ 0.0 4 0.0 wikitext comb_12 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1093063354492188 40.71396 0.0
37
+ 0.0 5 0.0 wikitext comb_12 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1093063354492188 40.71396 0.0
38
+ 0.0 6 0.0 wikitext comb_12 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1093063354492188 40.71396 0.0
39
+ 0.0 7 0.0 wikitext comb_12 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1093063354492188 40.71396 0.0
40
+ 0.0 8 0.0 wikitext comb_12 tinyllama nlr_t_no_sched 1897.394176 2160.06656 1.1093063354492188 40.71396 0.0
41
+ 0.2913205027580261 4 0.0 wikitext comb_14 tinyllama nlr_t_no_sched 1897.865216 2160.06656 9.837532043457031 27.404319 0.0
42
+ 0.3742992579936981 6 0.0 wikitext comb_17 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.776387691497803 27.433229 0.0
43
+ 0.37220534682273865 6 0.0 wikitext comb_16 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.813462257385254 27.438662 0.0
44
+ 0.09371834248304367 8 0.0 wikitext comb_18 tinyllama nlr_t_no_sched 1897.865216 2160.06656 29.213275909423828 27.457965 0.0
45
+ 0.3466734290122986 5 0.0 wikitext comb_14 tinyllama nlr_t_no_sched 1897.865216 2160.06656 7.701914310455322 27.479193 0.0
46
+ 0.3761904835700989 8 0.0 wikitext comb_17 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.669031620025635 27.484724 0.0
47
+ 0.30847686529159546 4 0.0 wikitext comb_2 tinyllama nlr_t_no_sched 1897.865216 2160.06656 8.844282150268555 27.49003 0.0
48
+ 0.3451874256134033 5 0.0 wikitext comb_17 tinyllama nlr_t_no_sched 1897.865216 2160.06656 7.8390889167785645 27.490512 0.0
49
+ 0.346065491437912 5 0.0 wikitext comb_2 tinyllama nlr_t_no_sched 1897.865216 2160.06656 7.72405481338501 27.500745 0.0
50
+ 0.34491726756095886 5 0.0 wikitext comb_16 tinyllama nlr_t_no_sched 1897.865216 2160.06656 7.801002025604248 27.503932 0.0
51
+ 0.372543066740036 7 0.0 wikitext comb_2 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.797382831573486 27.513916 0.0
52
+ 0.3766970932483673 8 0.0 wikitext comb_14 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.625375270843506 27.515933 0.0
53
+ 0.19415739178657532 4 0.0 wikitext comb_17 tinyllama nlr_t_no_sched 1897.865216 2160.06656 15.055026054382324 27.517325 0.0
54
+ 0.317088782787323 4 0.0 wikitext comb_16 tinyllama nlr_t_no_sched 1897.865216 2160.06656 8.428974151611328 27.519404 0.0
55
+ 0.3721039891242981 6 0.0 wikitext comb_14 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.838970184326172 27.568308 0.0
56
+ 0.3720364570617676 7 0.0 wikitext comb_17 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.772279739379883 27.573243 0.0
57
+ 0.37382641434669495 7 0.0 wikitext comb_16 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.789385795593262 27.58242 0.0
58
+ 0.37352246046066284 6 0.0 wikitext comb_2 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.798985958099365 27.5874 0.0
59
+ 0.37426549196243286 7 0.0 wikitext comb_14 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.708649635314941 27.600502 0.0
60
+ 0.37612298130989075 8 0.0 wikitext comb_16 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.650889873504639 27.67143 0.0
61
+ 0.3768659234046936 8 0.0 wikitext comb_2 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.639966011047363 27.684658 0.0
62
+ 0.29013848304748535 4 0.0 wikitext comb_3 tinyllama nlr_t_no_sched 1897.865216 2160.06656 9.911487579345703 34.627976 0.0
63
+ 0.37683218717575073 8 0.0 wikitext comb_3 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.642193794250488 34.647166 0.0
64
+ 0.3470449149608612 5 0.0 wikitext comb_3 tinyllama nlr_t_no_sched 1897.865216 2160.06656 7.678282737731934 34.654184 0.0
65
+ 0.3715636432170868 6 0.0 wikitext comb_3 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.86018705368042 34.760978 0.0
66
+ 0.3743330240249634 7 0.0 wikitext comb_3 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.723891735076904 34.825004 0.0
67
+ 0.34603172540664673 5 0.0 wikitext comb_7 tinyllama nlr_t_no_sched 1897.865216 2160.06656 7.698445796966553 40.770407 0.0
68
+ 0.2938196659088135 4 0.0 wikitext comb_7 tinyllama nlr_t_no_sched 1897.865216 2160.06656 9.86754035949707 40.815591 0.0
69
+ 0.16572104394435883 7 0.0 wikitext comb_10 tinyllama nlr_t_no_sched 1897.865216 2160.06656 16.877504348754883 40.820557 0.0
70
+ 0.34660589694976807 8 0.0 wikitext comb_10 tinyllama nlr_t_no_sched 1897.865216 2160.06656 7.364253520965576 40.908013 0.0
71
+ 0.37436679005622864 7 0.0 wikitext comb_7 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.7033820152282715 40.910472 0.0
72
+ 0.3727119565010071 6 0.0 wikitext comb_7 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.847280979156494 40.965379 0.0
73
+ 0.3773387372493744 8 0.0 wikitext comb_7 tinyllama nlr_t_no_sched 1897.865216 2160.06656 6.629304885864258 40.971027 0.0
74
+ 0.0 4 0.0 wikitext comb_6 tinyllama nlr_t_no_sched 1381.170176 2487.222272 1.1211762428283691 0.480479 0.0
75
+ 0.0 5 0.0 wikitext comb_6 tinyllama nlr_t_no_sched 1381.170176 2487.222272 1.1211762428283691 0.480479 0.0
76
+ 0.0 6 0.0 wikitext comb_6 tinyllama nlr_t_no_sched 1381.170176 2487.222272 1.1211762428283691 0.480479 0.0
77
+ 0.0 7 0.0 wikitext comb_6 tinyllama nlr_t_no_sched 1381.170176 2487.222272 1.1211762428283691 0.480479 0.0
78
+ 0.0 8 0.0 wikitext comb_6 tinyllama nlr_t_no_sched 1381.170176 2487.222272 1.1211762428283691 0.480479 0.0
79
+ 0.0 4 0.0 wikitext comb_4 tinyllama nlr_t_no_sched 2225.074688 2747.26912 1.1093051433563232 99.458451 0.0
80
+ 0.0 5 0.0 wikitext comb_4 tinyllama nlr_t_no_sched 2225.074688 2747.26912 1.1093051433563232 99.458451 0.0
81
+ 0.0 6 0.0 wikitext comb_4 tinyllama nlr_t_no_sched 2225.074688 2747.26912 1.1093051433563232 99.458451 0.0
82
+ 0.0 7 0.0 wikitext comb_4 tinyllama nlr_t_no_sched 2225.074688 2747.26912 1.1093051433563232 99.458451 0.0
83
+ 0.0 8 0.0 wikitext comb_4 tinyllama nlr_t_no_sched 2225.074688 2747.26912 1.1093051433563232 99.458451 0.0
84
+ 0.37814927101135254 32 0.0 wikitext base tinyllama ---- 4470.547968 4485.808128 6.595952033996582 11.691268 0.0
results/func_by_param_init_method/tinyllama/4/comb_14.png ADDED
results/func_by_param_init_method/tinyllama/4/comb_16.png ADDED
results/func_by_param_init_method/tinyllama/4/comb_17.png ADDED
results/func_by_param_init_method/tinyllama/4/comb_2.png ADDED
results/func_by_param_init_method/tinyllama/4/comb_3.png ADDED
results/func_by_param_init_method/tinyllama/4/comb_7.png ADDED
results/func_by_param_init_method/tinyllama/4/comb_8.png ADDED
results/func_by_param_init_method/tinyllama/5/comb_14.png ADDED
results/func_by_param_init_method/tinyllama/5/comb_16.png ADDED
results/func_by_param_init_method/tinyllama/5/comb_17.png ADDED
results/func_by_param_init_method/tinyllama/5/comb_2.png ADDED
results/func_by_param_init_method/tinyllama/5/comb_3.png ADDED
results/func_by_param_init_method/tinyllama/5/comb_7.png ADDED
results/func_by_param_init_method/tinyllama/5/comb_8.png ADDED
results/func_by_param_init_method/tinyllama/6/comb_14.png ADDED
results/func_by_param_init_method/tinyllama/6/comb_16.png ADDED
results/func_by_param_init_method/tinyllama/6/comb_17.png ADDED
results/func_by_param_init_method/tinyllama/6/comb_2.png ADDED
results/func_by_param_init_method/tinyllama/6/comb_3.png ADDED
results/func_by_param_init_method/tinyllama/6/comb_7.png ADDED
results/func_by_param_init_method/tinyllama/6/comb_8.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_10.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_14.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_16.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_17.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_18.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_2.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_3.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_7.png ADDED
results/func_by_param_init_method/tinyllama/7/comb_8.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_10.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_14.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_16.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_17.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_18.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_2.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_3.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_7.png ADDED
results/func_by_param_init_method/tinyllama/8/comb_8.png ADDED
results/results.txt ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ | | accuracy | bits | clip | dataset | method | model | params | peak_mem_alloc_mb | peak_mem_reserv_mb | perplexity | time_ms | wer |
2
+ |---:|-----------:|-------:|-------:|:----------|:---------|:----------|:---------------|--------------------:|---------------------:|-------------:|----------:|------:|
3
+ | 0 | 0.364167 | 4 | 0 | wikitext | ao_woq | tinyllama | fixed | 741.693 | 866.124 | 7.04309 | 18.557 | 0 |
4
+ | 1 | 0.377136 | 8 | 0 | wikitext | ao_woq | tinyllama | fixed | 1631.73 | 1988.1 | 6.60597 | 15.3906 | 0 |
5
+ | 2 | 0 | 4 | 0 | wikitext | comb_5 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.11067 | 19.4333 | 0 |
6
+ | 3 | 0 | 5 | 0 | wikitext | comb_5 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.11067 | 19.4333 | 0 |
7
+ | 4 | 0 | 6 | 0 | wikitext | comb_5 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.11067 | 19.4333 | 0 |
8
+ | 5 | 0 | 7 | 0 | wikitext | comb_5 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.11067 | 19.4333 | 0 |
9
+ | 6 | 0 | 8 | 0 | wikitext | comb_5 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.11067 | 19.4333 | 0 |
10
+ | 7 | 0 | 4 | 0 | wikitext | comb_11 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.10931 | 25.946 | 0 |
11
+ | 8 | 0 | 5 | 0 | wikitext | comb_11 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.10931 | 25.946 | 0 |
12
+ | 9 | 0 | 6 | 0 | wikitext | comb_11 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.10931 | 25.946 | 0 |
13
+ | 10 | 0 | 7 | 0 | wikitext | comb_11 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.10931 | 25.946 | 0 |
14
+ | 11 | 0 | 8 | 0 | wikitext | comb_11 | tinyllama | nlr_t_no_sched | 1895.56 | 2157.97 | 1.10931 | 25.946 | 0 |
15
+ | 12 | 0.372746 | 6 | 0 | wikitext | comb_8 | tinyllama | nlr_t_no_sched | 1896.03 | 2157.97 | 6.82512 | 14.8221 | 0 |
16
+ | 13 | 0.346741 | 5 | 0 | wikitext | comb_8 | tinyllama | nlr_t_no_sched | 1896.03 | 2157.97 | 7.69885 | 15.0443 | 0 |
17
+ | 14 | 0.377069 | 8 | 0 | wikitext | comb_8 | tinyllama | nlr_t_no_sched | 1896.03 | 2157.97 | 6.65275 | 15.0509 | 0 |
18
+ | 15 | 0.301013 | 4 | 0 | wikitext | comb_8 | tinyllama | nlr_t_no_sched | 1896.03 | 2157.97 | 9.37059 | 15.3035 | 0 |
19
+ | 16 | 0.374063 | 7 | 0 | wikitext | comb_8 | tinyllama | nlr_t_no_sched | 1896.03 | 2157.97 | 6.72676 | 15.7322 | 0 |
20
+ | 17 | 0.367612 | 5 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.9663 | 16.1302 | 0 |
21
+ | 18 | 0.376326 | 7 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.66335 | 16.1421 | 0 |
22
+ | 19 | 0.377271 | 8 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.60481 | 16.2501 | 0 |
23
+ | 20 | 0.346977 | 4 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 7.65536 | 16.4053 | 0 |
24
+ | 21 | 0.378588 | 6 | 0 | wikitext | woq | tinyllama | fixed | 1896.11 | 2160.07 | 6.50158 | 16.9224 | 0 |
25
+ | 22 | 0.0238095 | 7 | 0 | wikitext | comb_18 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.10207 | 27.3012 | 0 |
26
+ | 23 | 0 | 4 | 0 | wikitext | comb_18 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.13224 | 27.3195 | 0 |
27
+ | 24 | 0 | 5 | 0 | wikitext | comb_18 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.13224 | 27.3195 | 0 |
28
+ | 25 | 0 | 6 | 0 | wikitext | comb_18 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.13224 | 27.3195 | 0 |
29
+ | 26 | 0 | 4 | 0 | wikitext | comb_0 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.11743 | 27.3674 | 0 |
30
+ | 27 | 0 | 5 | 0 | wikitext | comb_0 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.11743 | 27.3674 | 0 |
31
+ | 28 | 0 | 6 | 0 | wikitext | comb_0 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.11743 | 27.3674 | 0 |
32
+ | 29 | 0 | 7 | 0 | wikitext | comb_0 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.11743 | 27.3674 | 0 |
33
+ | 30 | 0 | 8 | 0 | wikitext | comb_0 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.11743 | 27.3674 | 0 |
34
+ | 31 | 0 | 4 | 0 | wikitext | comb_10 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.12163 | 40.6003 | 0 |
35
+ | 32 | 0 | 5 | 0 | wikitext | comb_10 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.12163 | 40.6003 | 0 |
36
+ | 33 | 0 | 6 | 0 | wikitext | comb_10 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.12163 | 40.6003 | 0 |
37
+ | 34 | 0 | 4 | 0 | wikitext | comb_12 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.10931 | 40.714 | 0 |
38
+ | 35 | 0 | 5 | 0 | wikitext | comb_12 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.10931 | 40.714 | 0 |
39
+ | 36 | 0 | 6 | 0 | wikitext | comb_12 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.10931 | 40.714 | 0 |
40
+ | 37 | 0 | 7 | 0 | wikitext | comb_12 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.10931 | 40.714 | 0 |
41
+ | 38 | 0 | 8 | 0 | wikitext | comb_12 | tinyllama | nlr_t_no_sched | 1897.39 | 2160.07 | 1.10931 | 40.714 | 0 |
42
+ | 39 | 0.291321 | 4 | 0 | wikitext | comb_14 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 9.83753 | 27.4043 | 0 |
43
+ | 40 | 0.374299 | 6 | 0 | wikitext | comb_17 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.77639 | 27.4332 | 0 |
44
+ | 41 | 0.372205 | 6 | 0 | wikitext | comb_16 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.81346 | 27.4387 | 0 |
45
+ | 42 | 0.0937183 | 8 | 0 | wikitext | comb_18 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 29.2133 | 27.458 | 0 |
46
+ | 43 | 0.346673 | 5 | 0 | wikitext | comb_14 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 7.70191 | 27.4792 | 0 |
47
+ | 44 | 0.37619 | 8 | 0 | wikitext | comb_17 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.66903 | 27.4847 | 0 |
48
+ | 45 | 0.308477 | 4 | 0 | wikitext | comb_2 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 8.84428 | 27.49 | 0 |
49
+ | 46 | 0.345187 | 5 | 0 | wikitext | comb_17 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 7.83909 | 27.4905 | 0 |
50
+ | 47 | 0.346065 | 5 | 0 | wikitext | comb_2 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 7.72405 | 27.5007 | 0 |
51
+ | 48 | 0.344917 | 5 | 0 | wikitext | comb_16 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 7.801 | 27.5039 | 0 |
52
+ | 49 | 0.372543 | 7 | 0 | wikitext | comb_2 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.79738 | 27.5139 | 0 |
53
+ | 50 | 0.376697 | 8 | 0 | wikitext | comb_14 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.62538 | 27.5159 | 0 |
54
+ | 51 | 0.194157 | 4 | 0 | wikitext | comb_17 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 15.055 | 27.5173 | 0 |
55
+ | 52 | 0.317089 | 4 | 0 | wikitext | comb_16 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 8.42897 | 27.5194 | 0 |
56
+ | 53 | 0.372104 | 6 | 0 | wikitext | comb_14 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.83897 | 27.5683 | 0 |
57
+ | 54 | 0.372036 | 7 | 0 | wikitext | comb_17 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.77228 | 27.5732 | 0 |
58
+ | 55 | 0.373826 | 7 | 0 | wikitext | comb_16 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.78939 | 27.5824 | 0 |
59
+ | 56 | 0.373522 | 6 | 0 | wikitext | comb_2 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.79899 | 27.5874 | 0 |
60
+ | 57 | 0.374265 | 7 | 0 | wikitext | comb_14 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.70865 | 27.6005 | 0 |
61
+ | 58 | 0.376123 | 8 | 0 | wikitext | comb_16 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.65089 | 27.6714 | 0 |
62
+ | 59 | 0.376866 | 8 | 0 | wikitext | comb_2 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.63997 | 27.6847 | 0 |
63
+ | 60 | 0.290138 | 4 | 0 | wikitext | comb_3 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 9.91149 | 34.628 | 0 |
64
+ | 61 | 0.376832 | 8 | 0 | wikitext | comb_3 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.64219 | 34.6472 | 0 |
65
+ | 62 | 0.347045 | 5 | 0 | wikitext | comb_3 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 7.67828 | 34.6542 | 0 |
66
+ | 63 | 0.371564 | 6 | 0 | wikitext | comb_3 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.86019 | 34.761 | 0 |
67
+ | 64 | 0.374333 | 7 | 0 | wikitext | comb_3 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.72389 | 34.825 | 0 |
68
+ | 65 | 0.346032 | 5 | 0 | wikitext | comb_7 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 7.69845 | 40.7704 | 0 |
69
+ | 66 | 0.29382 | 4 | 0 | wikitext | comb_7 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 9.86754 | 40.8156 | 0 |
70
+ | 67 | 0.165721 | 7 | 0 | wikitext | comb_10 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 16.8775 | 40.8206 | 0 |
71
+ | 68 | 0.346606 | 8 | 0 | wikitext | comb_10 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 7.36425 | 40.908 | 0 |
72
+ | 69 | 0.374367 | 7 | 0 | wikitext | comb_7 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.70338 | 40.9105 | 0 |
73
+ | 70 | 0.372712 | 6 | 0 | wikitext | comb_7 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.84728 | 40.9654 | 0 |
74
+ | 71 | 0.377339 | 8 | 0 | wikitext | comb_7 | tinyllama | nlr_t_no_sched | 1897.87 | 2160.07 | 6.6293 | 40.971 | 0 |
75
+ | 72 | 0 | 4 | 0 | wikitext | comb_6 | tinyllama | nlr_t_no_sched | 1381.17 | 2487.22 | 1.12118 | 0.480479 | 0 |
76
+ | 73 | 0 | 5 | 0 | wikitext | comb_6 | tinyllama | nlr_t_no_sched | 1381.17 | 2487.22 | 1.12118 | 0.480479 | 0 |
77
+ | 74 | 0 | 6 | 0 | wikitext | comb_6 | tinyllama | nlr_t_no_sched | 1381.17 | 2487.22 | 1.12118 | 0.480479 | 0 |
78
+ | 75 | 0 | 7 | 0 | wikitext | comb_6 | tinyllama | nlr_t_no_sched | 1381.17 | 2487.22 | 1.12118 | 0.480479 | 0 |
79
+ | 76 | 0 | 8 | 0 | wikitext | comb_6 | tinyllama | nlr_t_no_sched | 1381.17 | 2487.22 | 1.12118 | 0.480479 | 0 |
80
+ | 77 | 0 | 4 | 0 | wikitext | comb_4 | tinyllama | nlr_t_no_sched | 2225.07 | 2747.27 | 1.10931 | 99.4585 | 0 |
81
+ | 78 | 0 | 5 | 0 | wikitext | comb_4 | tinyllama | nlr_t_no_sched | 2225.07 | 2747.27 | 1.10931 | 99.4585 | 0 |
82
+ | 79 | 0 | 6 | 0 | wikitext | comb_4 | tinyllama | nlr_t_no_sched | 2225.07 | 2747.27 | 1.10931 | 99.4585 | 0 |
83
+ | 80 | 0 | 7 | 0 | wikitext | comb_4 | tinyllama | nlr_t_no_sched | 2225.07 | 2747.27 | 1.10931 | 99.4585 | 0 |
84
+ | 81 | 0 | 8 | 0 | wikitext | comb_4 | tinyllama | nlr_t_no_sched | 2225.07 | 2747.27 | 1.10931 | 99.4585 | 0 |
85
+ | 82 | 0.378149 | 32 | 0 | wikitext | base | tinyllama | ---- | 4470.55 | 4485.81 | 6.59595 | 11.6913 | 0 |