mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-11-13 14:29:52 +00:00
k-quants : fix zero-weight guard in Q6_K (ref #3040)
This commit is contained in:
parent
ea2c85d5d2
commit
178b1850eb
@@ -1089,6 +1089,7 @@ void quantize_row_q6_K_reference(const float * restrict x, block_q6_K * restrict
|
|||||||
if (!max_abs_scale) {
|
if (!max_abs_scale) {
|
||||||
memset(&y[i], 0, sizeof(block_q6_K));
|
memset(&y[i], 0, sizeof(block_q6_K));
|
||||||
y[i].d = ggml_fp32_to_fp16(0.f);
|
y[i].d = ggml_fp32_to_fp16(0.f);
|
||||||
|
x += QK_K;
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user