Update README.md
Browse files
README.md
CHANGED
@@ -16,7 +16,7 @@ a bit of Serbian, and a bit of Croatian languages.
|
|
16 |
ARC and PPL-512 DATA (get the latest data from the main post of the PR thread):
|
17 |
|
18 |
```
|
19 |
-
IQ1_XS
|
20 |
PR
|
21 |
1.94 GB (1.93 BPW)
|
22 |
1.81 GiB (1.93 BPW)
|
@@ -24,7 +24,7 @@ PR
|
|
24 |
PPL over 564 chunks for n_ctx=512 = 40.0024 +/- 0.27710
|
25 |
|
26 |
|
27 |
-
IQ1_S
|
28 |
Master
|
29 |
2.01 GB (2.00 BPW)
|
30 |
1.87 GiB (2.00 BPW)
|
@@ -48,7 +48,7 @@ PR
|
|
48 |
PPL over 564 chunks for n_ctx=512 = 20.0588 +/- 0.14001
|
49 |
|
50 |
|
51 |
-
IQ1_XL
|
52 |
PR
|
53 |
2.21 GB (2.21 BPW)
|
54 |
2.06 GiB (2.21 BPW)
|
@@ -59,6 +59,11 @@ PR2
|
|
59 |
2.08 GiB (2.22 BPW)
|
60 |
PPL over 564 chunks for n_ctx=512 = 17.4537 +/- 0.11995
|
61 |
|
|
|
|
|
|
|
|
|
|
|
62 |
|
63 |
IQ2_XXS
|
64 |
Master
|
@@ -71,6 +76,11 @@ PR
|
|
71 |
2.22 GiB (2.37 BPW)
|
72 |
PPL over 564 chunks for n_ctx=512 = 13.8073 +/- 0.09290
|
73 |
|
|
|
|
|
|
|
|
|
|
|
74 |
|
75 |
IQ2_XS
|
76 |
Master
|
@@ -93,6 +103,11 @@ PR3
|
|
93 |
2.40 GiB (2.57 BPW)
|
94 |
PPL over 564 chunks for n_ctx=512 = 11.3031 +/- 0.07514
|
95 |
|
|
|
|
|
|
|
|
|
|
|
96 |
|
97 |
IQ2_S
|
98 |
Master
|
|
|
16 |
ARC and PPL-512 DATA (get the latest data from the main post of the PR thread):
|
17 |
|
18 |
```
|
19 |
+
IQ1_XS - Unusable on <30B models
|
20 |
PR
|
21 |
1.94 GB (1.93 BPW)
|
22 |
1.81 GiB (1.93 BPW)
|
|
|
24 |
PPL over 564 chunks for n_ctx=512 = 40.0024 +/- 0.27710
|
25 |
|
26 |
|
27 |
+
IQ1_S - Unusable on <30B models
|
28 |
Master
|
29 |
2.01 GB (2.00 BPW)
|
30 |
1.87 GiB (2.00 BPW)
|
|
|
48 |
PPL over 564 chunks for n_ctx=512 = 20.0588 +/- 0.14001
|
49 |
|
50 |
|
51 |
+
IQ1_XL - Unusable on <=13B models
|
52 |
PR
|
53 |
2.21 GB (2.21 BPW)
|
54 |
2.06 GiB (2.21 BPW)
|
|
|
59 |
2.08 GiB (2.22 BPW)
|
60 |
PPL over 564 chunks for n_ctx=512 = 17.4537 +/- 0.11995
|
61 |
|
62 |
+
PR3
|
63 |
+
2.25 GB (2.25 BPW)
|
64 |
+
2.10 GiB (2.25 BPW)
|
65 |
+
PPL over 564 chunks for n_ctx=512 = 17.3669 +/- 0.11928
|
66 |
+
|
67 |
|
68 |
IQ2_XXS
|
69 |
Master
|
|
|
76 |
2.22 GiB (2.37 BPW)
|
77 |
PPL over 564 chunks for n_ctx=512 = 13.8073 +/- 0.09290
|
78 |
|
79 |
+
PR2
|
80 |
+
2.40 GB (2.39 BPW)
|
81 |
+
2.23 GiB (2.39 BPW)
|
82 |
+
PPL over 564 chunks for n_ctx=512 = 12.9671 +/- 0.08687
|
83 |
+
|
84 |
|
85 |
IQ2_XS
|
86 |
Master
|
|
|
103 |
2.40 GiB (2.57 BPW)
|
104 |
PPL over 564 chunks for n_ctx=512 = 11.3031 +/- 0.07514
|
105 |
|
106 |
+
PR4
|
107 |
+
2.59 GB (2.58 BPW)
|
108 |
+
2.42 GiB (2.58 BPW)
|
109 |
+
PPL over 564 chunks for n_ctx=512 = 10.9291 +/- 0.07270
|
110 |
+
|
111 |
|
112 |
IQ2_S
|
113 |
Master
|