Upload results for llama3
Browse files- results/df.tsv +69 -0
- results/results.txt +70 -0
results/df.tsv
ADDED
@@ -0,0 +1,69 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
accuracy bits clip dataset method model params peak_mem_alloc_mb peak_mem_reserv_mb perplexity time_ms wer
|
2 |
+
0.4277946949005127 4 0.0 wikitext ao_woq llama3 fixed 5542.623744 7163.871232 5.3583574295043945 39.500762 0.0
|
3 |
+
0.0 4 0.0 wikitext comb_5 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.2404379844665527 121.466856 0.0
|
4 |
+
0.0 4 0.0 wikitext comb_11 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.1248141527175903 145.935296 0.0
|
5 |
+
0.065552182495594 4 0.0 wikitext comb_8 llama3 nlr_t_no_sched 14179.216384 15367.929856 51.48540115356445 69.068076 0.0
|
6 |
+
0.3797703683376312 4 0.0 wikitext woq llama3 fixed 14179.331584 15367.929856 6.163248062133789 95.588442 0.0
|
7 |
+
0.0047619054093956 4 0.0 wikitext comb_18 llama3 nlr_t_no_sched 14185.276416 15374.221312 1.1258682012557983 147.906492 0.0
|
8 |
+
0.0079365093261003 4 0.0 wikitext comb_10 llama3 nlr_t_no_sched 14185.276416 15374.221312 1.1351985931396484 201.489016 0.0
|
9 |
+
0.0546975657343864 4 0.0 wikitext comb_3 llama3 nlr_t_no_sched 14185.341952 15374.221312 1.9115358591079712 175.816608 0.0
|
10 |
+
0.0621118061244487 4 0.0 wikitext comb_14 llama3 nlr_t_no_sched 14185.66656 15374.221312 29.12266540527344 147.944895 0.0
|
11 |
+
0.2624451220035553 4 0.0 wikitext comb_17 llama3 nlr_t_no_sched 14185.747456 15374.221312 11.384479522705078 147.678698 0.0
|
12 |
+
0.241843968629837 4 0.0 wikitext comb_16 llama3 nlr_t_no_sched 14185.747456 15374.221312 13.005107879638672 147.69713 0.0
|
13 |
+
0.124822698533535 4 0.0 wikitext comb_2 llama3 nlr_t_no_sched 14185.747456 15374.221312 28.73665809631348 148.042488 0.0
|
14 |
+
0.0600135140120983 4 0.0 wikitext comb_7 llama3 nlr_t_no_sched 14185.747456 15374.221312 58.5887565612793 201.604194 0.0
|
15 |
+
0.0 4 0.0 wikitext comb_6 llama3 nlr_t_no_sched 11051.945984 18748.53888 1.1451951265335083 4.409536 0.0
|
16 |
+
0.0 7 0.0 wikitext comb_5 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.1227006912231443 121.210918 0.0
|
17 |
+
0.0 7 0.0 wikitext comb_11 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.1248141527175903 145.789043 0.0
|
18 |
+
0.4441067278385162 7 0.0 wikitext comb_8 llama3 nlr_t_no_sched 14179.216384 15367.929856 5.2373480796813965 68.5546 0.0
|
19 |
+
0.4427558183670044 7 0.0 wikitext woq llama3 fixed 14179.331584 15367.929856 5.248887062072754 95.510221 0.0
|
20 |
+
0.0 7 0.0 wikitext comb_18 llama3 nlr_t_no_sched 14185.276416 15374.221312 1.14442241191864 147.962915 0.0
|
21 |
+
0.0274170320481061 7 0.0 wikitext comb_10 llama3 nlr_t_no_sched 14185.27744 15374.221312 1.1136080026626587 201.44854 0.0
|
22 |
+
0.4438365399837494 7 0.0 wikitext comb_17 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.2295026779174805 147.263902 0.0
|
23 |
+
0.4435663521289825 7 0.0 wikitext comb_14 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.23347806930542 147.349152 0.0
|
24 |
+
0.4436339139938354 7 0.0 wikitext comb_16 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.234407901763916 147.630622 0.0
|
25 |
+
0.4438365399837494 7 0.0 wikitext comb_2 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.240307331085205 147.907941 0.0
|
26 |
+
0.4431948661804199 7 0.0 wikitext comb_3 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.228732109069824 175.129737 0.0
|
27 |
+
0.4434650540351867 7 0.0 wikitext comb_7 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.239895343780518 201.007751 0.0
|
28 |
+
0.0 7 0.0 wikitext comb_6 llama3 nlr_t_no_sched 11051.945984 18748.53888 1.150550365447998 4.409446 0.0
|
29 |
+
0.4437352418899536 8 0.0 wikitext ao_woq llama3 fixed 12110.375936 14040.43264 5.208643436431885 52.35414 0.0
|
30 |
+
0.0 8 0.0 wikitext comb_5 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.1235297918319702 121.529527 0.0
|
31 |
+
0.0 8 0.0 wikitext comb_11 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.1248141527175903 146.053433 0.0
|
32 |
+
0.443498820066452 8 0.0 wikitext comb_8 llama3 nlr_t_no_sched 14179.216384 15367.929856 5.202676296234131 69.423541 0.0
|
33 |
+
0.443870335817337 8 0.0 wikitext woq llama3 fixed 14179.331584 15367.929856 5.208242893218994 95.591094 0.0
|
34 |
+
0.4438365399837494 8 0.0 wikitext comb_14 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.206423759460449 147.850202 0.0
|
35 |
+
0.4432962238788605 8 0.0 wikitext comb_17 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.215326309204102 147.90709 0.0
|
36 |
+
0.0827760845422744 8 0.0 wikitext comb_18 llama3 nlr_t_no_sched 14185.747456 15374.221312 33.215667724609375 147.999591 0.0
|
37 |
+
0.4439716637134552 8 0.0 wikitext comb_2 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.211247444152832 148.099943 0.0
|
38 |
+
0.443363755941391 8 0.0 wikitext comb_16 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.2125773429870605 148.327226 0.0
|
39 |
+
0.4439041018486023 8 0.0 wikitext comb_3 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.213589668273926 175.339251 0.0
|
40 |
+
0.3078352212905884 8 0.0 wikitext comb_10 llama3 nlr_t_no_sched 14185.747456 15374.221312 8.37353801727295 201.392404 0.0
|
41 |
+
0.4443093538284302 8 0.0 wikitext comb_7 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.203152179718018 201.603874 0.0
|
42 |
+
0.0 8 0.0 wikitext comb_6 llama3 nlr_t_no_sched 11051.945984 18748.53888 1.1399809122085571 4.418255 0.0
|
43 |
+
0.0 6 0.0 wikitext comb_5 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.145577907562256 121.159422 0.0
|
44 |
+
0.0 6 0.0 wikitext comb_11 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.1248141527175903 146.114884 0.0
|
45 |
+
0.4381628036499023 6 0.0 wikitext comb_8 llama3 nlr_t_no_sched 14179.216384 15367.929856 5.209409236907959 69.01063 0.0
|
46 |
+
0.4409320950508117 6 0.0 wikitext woq llama3 fixed 14179.331584 15367.929856 5.193300724029541 95.697418 0.0
|
47 |
+
0.0 6 0.0 wikitext comb_18 llama3 nlr_t_no_sched 14185.276416 15374.221312 1.1636452674865725 148.035144 0.0
|
48 |
+
0.0 6 0.0 wikitext comb_10 llama3 nlr_t_no_sched 14185.276416 15374.221312 1.1606180667877195 201.552603 0.0
|
49 |
+
0.4382641315460205 6 0.0 wikitext comb_16 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.218070030212402 147.619341 0.0
|
50 |
+
0.4389395713806152 6 0.0 wikitext comb_17 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.210784912109375 147.885593 0.0
|
51 |
+
0.4374535977840423 6 0.0 wikitext comb_2 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.207483768463135 147.984403 0.0
|
52 |
+
0.4377575218677521 6 0.0 wikitext comb_14 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.234193801879883 148.281961 0.0
|
53 |
+
0.4386356174945831 6 0.0 wikitext comb_3 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.227176189422607 175.940369 0.0
|
54 |
+
0.4378926157951355 6 0.0 wikitext comb_7 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.239664554595947 201.404379 0.0
|
55 |
+
0.0 6 0.0 wikitext comb_6 llama3 nlr_t_no_sched 11051.945984 18748.53888 1.1385393142700195 4.417957 0.0
|
56 |
+
0.0 5 0.0 wikitext comb_5 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.2200177907943726 121.614514 0.0
|
57 |
+
0.0 5 0.0 wikitext comb_11 llama3 nlr_t_no_sched 14178.745344 15367.929856 1.1248141527175903 146.125173 0.0
|
58 |
+
0.3920635282993316 5 0.0 wikitext comb_8 llama3 nlr_t_no_sched 14179.216384 15367.929856 6.063994884490967 68.929145 0.0
|
59 |
+
0.4355623126029968 5 0.0 wikitext woq llama3 fixed 14179.331584 15367.929856 5.448963165283203 95.602699 0.0
|
60 |
+
0.0095238108187913 5 0.0 wikitext comb_18 llama3 nlr_t_no_sched 14185.276416 15374.221312 1.1374850273132324 148.163994 0.0
|
61 |
+
0.0031746034510433 5 0.0 wikitext comb_10 llama3 nlr_t_no_sched 14185.276416 15374.221312 1.1366512775421145 201.653023 0.0
|
62 |
+
0.3940898478031158 5 0.0 wikitext comb_14 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.969732761383057 147.499204 0.0
|
63 |
+
0.3852414786815643 5 0.0 wikitext comb_17 llama3 nlr_t_no_sched 14185.747456 15374.221312 6.185377597808838 147.726175 0.0
|
64 |
+
0.3841270208358764 5 0.0 wikitext comb_16 llama3 nlr_t_no_sched 14185.747456 15374.221312 6.20028018951416 147.991972 0.0
|
65 |
+
0.3874029219150543 5 0.0 wikitext comb_2 llama3 nlr_t_no_sched 14185.747456 15374.221312 6.124840259552002 148.051112 0.0
|
66 |
+
0.3967240750789642 5 0.0 wikitext comb_3 llama3 nlr_t_no_sched 14185.747456 15374.221312 5.949668884277344 175.763149 0.0
|
67 |
+
0.3933468759059906 5 0.0 wikitext comb_7 llama3 nlr_t_no_sched 14185.747456 15374.221312 6.018429279327393 200.980925 0.0
|
68 |
+
0.0 5 0.0 wikitext comb_6 llama3 nlr_t_no_sched 11051.945984 18748.53888 1.1440914869308472 4.421197 0.0
|
69 |
+
0.4436677098274231 32 0.0 wikitext base llama3 ---- 33003.526656 33155.97312 5.223813056945801 26.241893 0.0
|
results/results.txt
ADDED
@@ -0,0 +1,70 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
| | accuracy | bits | clip | dataset | method | model | params | peak_mem_alloc_mb | peak_mem_reserv_mb | perplexity | time_ms | wer |
|
2 |
+
|---:|-----------:|-------:|-------:|:----------|:---------|:--------|:---------------|--------------------:|---------------------:|-------------:|----------:|------:|
|
3 |
+
| 0 | 0.4278 | 4 | 0 | wikitext | ao_woq | llama3 | fixed | 5542.62 | 7163.87 | 5.3584 | 39.5008 | 0 |
|
4 |
+
| 1 | 0 | 4 | 0 | wikitext | comb_5 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.2404 | 121.467 | 0 |
|
5 |
+
| 2 | 0 | 4 | 0 | wikitext | comb_11 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.1248 | 145.935 | 0 |
|
6 |
+
| 3 | 0.0656 | 4 | 0 | wikitext | comb_8 | llama3 | nlr_t_no_sched | 14179.2 | 15367.9 | 51.4854 | 69.0681 | 0 |
|
7 |
+
| 4 | 0.3798 | 4 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 6.1632 | 95.5884 | 0 |
|
8 |
+
| 5 | 0.0048 | 4 | 0 | wikitext | comb_18 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.1259 | 147.906 | 0 |
|
9 |
+
| 6 | 0.0079 | 4 | 0 | wikitext | comb_10 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.1352 | 201.489 | 0 |
|
10 |
+
| 7 | 0.0547 | 4 | 0 | wikitext | comb_3 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.9115 | 175.817 | 0 |
|
11 |
+
| 8 | 0.0621 | 4 | 0 | wikitext | comb_14 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 29.1227 | 147.945 | 0 |
|
12 |
+
| 9 | 0.2624 | 4 | 0 | wikitext | comb_17 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 11.3845 | 147.679 | 0 |
|
13 |
+
| 10 | 0.2418 | 4 | 0 | wikitext | comb_16 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 13.0051 | 147.697 | 0 |
|
14 |
+
| 11 | 0.1248 | 4 | 0 | wikitext | comb_2 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 28.7367 | 148.042 | 0 |
|
15 |
+
| 12 | 0.06 | 4 | 0 | wikitext | comb_7 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 58.5888 | 201.604 | 0 |
|
16 |
+
| 13 | 0 | 4 | 0 | wikitext | comb_6 | llama3 | nlr_t_no_sched | 11051.9 | 18748.5 | 1.1452 | 4.4095 | 0 |
|
17 |
+
| 0 | 0 | 7 | 0 | wikitext | comb_5 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.1227 | 121.211 | 0 |
|
18 |
+
| 1 | 0 | 7 | 0 | wikitext | comb_11 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.1248 | 145.789 | 0 |
|
19 |
+
| 2 | 0.4441 | 7 | 0 | wikitext | comb_8 | llama3 | nlr_t_no_sched | 14179.2 | 15367.9 | 5.2373 | 68.5546 | 0 |
|
20 |
+
| 3 | 0.4428 | 7 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 5.2489 | 95.5102 | 0 |
|
21 |
+
| 4 | 0 | 7 | 0 | wikitext | comb_18 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.1444 | 147.963 | 0 |
|
22 |
+
| 5 | 0.0274 | 7 | 0 | wikitext | comb_10 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.1136 | 201.448 | 0 |
|
23 |
+
| 6 | 0.4438 | 7 | 0 | wikitext | comb_17 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2295 | 147.264 | 0 |
|
24 |
+
| 7 | 0.4436 | 7 | 0 | wikitext | comb_14 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2335 | 147.349 | 0 |
|
25 |
+
| 8 | 0.4436 | 7 | 0 | wikitext | comb_16 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2344 | 147.631 | 0 |
|
26 |
+
| 9 | 0.4438 | 7 | 0 | wikitext | comb_2 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2403 | 147.908 | 0 |
|
27 |
+
| 10 | 0.4432 | 7 | 0 | wikitext | comb_3 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2287 | 175.13 | 0 |
|
28 |
+
| 11 | 0.4435 | 7 | 0 | wikitext | comb_7 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2399 | 201.008 | 0 |
|
29 |
+
| 12 | 0 | 7 | 0 | wikitext | comb_6 | llama3 | nlr_t_no_sched | 11051.9 | 18748.5 | 1.1506 | 4.4094 | 0 |
|
30 |
+
| 0 | 0.4437 | 8 | 0 | wikitext | ao_woq | llama3 | fixed | 12110.4 | 14040.4 | 5.2086 | 52.3541 | 0 |
|
31 |
+
| 1 | 0 | 8 | 0 | wikitext | comb_5 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.1235 | 121.529 | 0 |
|
32 |
+
| 2 | 0 | 8 | 0 | wikitext | comb_11 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.1248 | 146.053 | 0 |
|
33 |
+
| 3 | 0.4435 | 8 | 0 | wikitext | comb_8 | llama3 | nlr_t_no_sched | 14179.2 | 15367.9 | 5.2027 | 69.4235 | 0 |
|
34 |
+
| 4 | 0.4439 | 8 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 5.2082 | 95.5911 | 0 |
|
35 |
+
| 5 | 0.4438 | 8 | 0 | wikitext | comb_14 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2064 | 147.85 | 0 |
|
36 |
+
| 6 | 0.4433 | 8 | 0 | wikitext | comb_17 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2153 | 147.907 | 0 |
|
37 |
+
| 7 | 0.0828 | 8 | 0 | wikitext | comb_18 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 33.2157 | 148 | 0 |
|
38 |
+
| 8 | 0.444 | 8 | 0 | wikitext | comb_2 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2112 | 148.1 | 0 |
|
39 |
+
| 9 | 0.4434 | 8 | 0 | wikitext | comb_16 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2126 | 148.327 | 0 |
|
40 |
+
| 10 | 0.4439 | 8 | 0 | wikitext | comb_3 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2136 | 175.339 | 0 |
|
41 |
+
| 11 | 0.3078 | 8 | 0 | wikitext | comb_10 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 8.3735 | 201.392 | 0 |
|
42 |
+
| 12 | 0.4443 | 8 | 0 | wikitext | comb_7 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2032 | 201.604 | 0 |
|
43 |
+
| 13 | 0 | 8 | 0 | wikitext | comb_6 | llama3 | nlr_t_no_sched | 11051.9 | 18748.5 | 1.14 | 4.4183 | 0 |
|
44 |
+
| 0 | 0 | 6 | 0 | wikitext | comb_5 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.1456 | 121.159 | 0 |
|
45 |
+
| 1 | 0 | 6 | 0 | wikitext | comb_11 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.1248 | 146.115 | 0 |
|
46 |
+
| 2 | 0.4382 | 6 | 0 | wikitext | comb_8 | llama3 | nlr_t_no_sched | 14179.2 | 15367.9 | 5.2094 | 69.0106 | 0 |
|
47 |
+
| 3 | 0.4409 | 6 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 5.1933 | 95.6974 | 0 |
|
48 |
+
| 4 | 0 | 6 | 0 | wikitext | comb_18 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.1636 | 148.035 | 0 |
|
49 |
+
| 5 | 0 | 6 | 0 | wikitext | comb_10 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.1606 | 201.553 | 0 |
|
50 |
+
| 6 | 0.4383 | 6 | 0 | wikitext | comb_16 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2181 | 147.619 | 0 |
|
51 |
+
| 7 | 0.4389 | 6 | 0 | wikitext | comb_17 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2108 | 147.886 | 0 |
|
52 |
+
| 8 | 0.4375 | 6 | 0 | wikitext | comb_2 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2075 | 147.984 | 0 |
|
53 |
+
| 9 | 0.4378 | 6 | 0 | wikitext | comb_14 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2342 | 148.282 | 0 |
|
54 |
+
| 10 | 0.4386 | 6 | 0 | wikitext | comb_3 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2272 | 175.94 | 0 |
|
55 |
+
| 11 | 0.4379 | 6 | 0 | wikitext | comb_7 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.2397 | 201.404 | 0 |
|
56 |
+
| 12 | 0 | 6 | 0 | wikitext | comb_6 | llama3 | nlr_t_no_sched | 11051.9 | 18748.5 | 1.1385 | 4.418 | 0 |
|
57 |
+
| 0 | 0 | 5 | 0 | wikitext | comb_5 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.22 | 121.615 | 0 |
|
58 |
+
| 1 | 0 | 5 | 0 | wikitext | comb_11 | llama3 | nlr_t_no_sched | 14178.7 | 15367.9 | 1.1248 | 146.125 | 0 |
|
59 |
+
| 2 | 0.3921 | 5 | 0 | wikitext | comb_8 | llama3 | nlr_t_no_sched | 14179.2 | 15367.9 | 6.064 | 68.9291 | 0 |
|
60 |
+
| 3 | 0.4356 | 5 | 0 | wikitext | woq | llama3 | fixed | 14179.3 | 15367.9 | 5.449 | 95.6027 | 0 |
|
61 |
+
| 4 | 0.0095 | 5 | 0 | wikitext | comb_18 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.1375 | 148.164 | 0 |
|
62 |
+
| 5 | 0.0032 | 5 | 0 | wikitext | comb_10 | llama3 | nlr_t_no_sched | 14185.3 | 15374.2 | 1.1367 | 201.653 | 0 |
|
63 |
+
| 6 | 0.3941 | 5 | 0 | wikitext | comb_14 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.9697 | 147.499 | 0 |
|
64 |
+
| 7 | 0.3852 | 5 | 0 | wikitext | comb_17 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 6.1854 | 147.726 | 0 |
|
65 |
+
| 8 | 0.3841 | 5 | 0 | wikitext | comb_16 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 6.2003 | 147.992 | 0 |
|
66 |
+
| 9 | 0.3874 | 5 | 0 | wikitext | comb_2 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 6.1248 | 148.051 | 0 |
|
67 |
+
| 10 | 0.3967 | 5 | 0 | wikitext | comb_3 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 5.9497 | 175.763 | 0 |
|
68 |
+
| 11 | 0.3933 | 5 | 0 | wikitext | comb_7 | llama3 | nlr_t_no_sched | 14185.7 | 15374.2 | 6.0184 | 200.981 | 0 |
|
69 |
+
| 12 | 0 | 5 | 0 | wikitext | comb_6 | llama3 | nlr_t_no_sched | 11051.9 | 18748.5 | 1.1441 | 4.4212 | 0 |
|
70 |
+
| 14 | 0.4437 | 32 | 0 | wikitext | base | llama3 | ---- | 33003.5 | 33156 | 5.2238 | 26.2419 | 0 |
|