ggml : fix Q4_1 quantization

2024-12-29 12:54:35 +00:00 · 2023-05-07 18:07:11 +03:00 · 2023-05-07 18:07:11 +03:00 · c216656990
commit c216656990
parent 4991499a5a
1 changed file with 2 additions and 2 deletions
--- a/ggml.c
+++ b/ggml.c
@@ -826,8 +826,8 @@ static void quantize_row_q4_1_reference(const float * restrict x, block_q4_1 * r
        y[i].m = min;
        for (int l = 0; l < qk/2; ++l) {
-            const float x0 = (x[0    + l] - min)*id;
+            const float x0 = (x[i*qk + 0    + l] - min)*id;
-            const float x1 = (x[qk/2 + l] - min)*id;
+            const float x1 = (x[i*qk + qk/2 + l] - min)*id;
            const uint8_t xi0 = MIN(15, (int8_t)(x0 + 0.5f));
            const uint8_t xi1 = MIN(15, (int8_t)(x1 + 0.5f));