From 8fbf7777cec57adee97c2b02e0a648e919c94963 Mon Sep 17 00:00:00 2001
From: Georgi Gerganov
Date: Sun, 7 May 2023 20:26:02 +0300
Subject: [PATCH] ggml : fix Q5_0 quantization

---
 ggml.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/ggml.c b/ggml.c
index 623b15e9b..50f830e65 100644
--- a/ggml.c
+++ b/ggml.c
@@ -845,7 +845,7 @@ static void quantize_row_q5_0_reference(const float * restrict x, block_q5_0 * r
         const float d = max / -16;
         const float id = d ? 1.0f/d : 0.0f;
 
-        y[i].d = d;
+        y[i].d = GGML_FP32_TO_FP16(d);
 
         uint32_t qh = 0;