Update README.md
Browse files
README.md
CHANGED
@@ -25,15 +25,15 @@ full wiki.train would have taken 10h
|
|
25 |
For more info on imatrix handling, see https://github.com/ggerganov/llama.cpp/pull/5302
|
26 |
|
27 |
### ppl (512 wiki.test, 300 chunks)
|
28 |
-
| quant
|
29 |
-
|
30 |
-
| f16(baseline)
|
31 |
-
| q8_0
|
32 |
-
| q5_k_m
|
33 |
-
| q4_k_m
|
34 |
-
| iq3_xxs
|
35 |
-
| iq3_xxs(wiki)
|
36 |
-
| iq3_xxs(kal)
|
37 |
-
| q2_k
|
38 |
-
| iq2_xs
|
39 |
-
| iq2_xxs
|
|
|
25 |
For more info on imatrix handling, see https://github.com/ggerganov/llama.cpp/pull/5302
|
26 |
|
27 |
### ppl (512 wiki.test, 300 chunks)
|
28 |
+
| quant | ppl (lower is better) |
|
29 |
+
|--------------------|-----|
|
30 |
+
| f16(baseline) | 5.8839 +/- 0.05173 |
|
31 |
+
| q8_0 | xxx |
|
32 |
+
| q5_k_m | xxx |
|
33 |
+
| q4_k_m | xxx |
|
34 |
+
| iq3_xxs | 6.1984 +/- 0.05475 |
|
35 |
+
| iq3_xxs(only-wiki) | 6.1796 +/- 0.05446 |
|
36 |
+
| iq3_xxs(only-kal) | 6.1984 +/- 0.05475 |
|
37 |
+
| q2_k | xxx |
|
38 |
+
| iq2_xs | xxx |
|
39 |
+
| iq2_xxs | xxx |
|