@@ -17,6 +17,7 @@ struct quant_option {
1717
1818static  const  std::vector<struct  quant_option > QUANT_OPTIONS = {
1919    { " Q4_0" "  4.34G, +0.4685 ppl @ Llama-3-8B" 
20+     { " Q4_0_B16" "  3.56G, 5.9624 +/- 0.03348 ppl @ LLaMA-v2-7B" 
2021    { " Q4_1" "  4.78G, +0.4511 ppl @ Llama-3-8B" 
2122    { " Q5_0" "  5.21G, +0.1316 ppl @ Llama-3-8B" 
2223    { " Q5_1" "  5.65G, +0.1062 ppl @ Llama-3-8B" 
@@ -46,6 +47,7 @@ static const std::vector<struct quant_option> QUANT_OPTIONS = {
4647    { " Q5_K_M" "  5.33G, +0.0569 ppl @ Llama-3-8B" 
4748    { " Q6_K" "  6.14G, +0.0217 ppl @ Llama-3-8B" 
4849    { " Q8_0" "  7.96G, +0.0026 ppl @ Llama-3-8B" 
50+     { " Q8_0_B16" "  6.70G, 5.8011 +/- 0.03239 ppl @ LLaMA-v1-7B" 
4951    { " Q4_0_4_4" "  4.34G, +0.4685 ppl @ Llama-3-8B" 
5052    { " Q4_0_4_8" "  4.34G, +0.4685 ppl @ Llama-3-8B" 
5153    { " Q4_0_8_8" "  4.34G, +0.4685 ppl @ Llama-3-8B" 
0 commit comments