mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-27 03:44:35 +00:00
ggml : do not break cuBLAS build (Q4_3 is not yet implemented)
This commit is contained in:
parent
66aab46079
commit
8a1756abdf
3
ggml.c
3
ggml.c
@@ -8040,9 +8040,6 @@ static void ggml_compute_forward_mul_mat_q_f32(
     else if (type == GGML_TYPE_Q4_2) {
         dequantize_row_q_cuda = dequantize_row_q4_2_cuda;
     }
-    else if (type == GGML_TYPE_Q4_3) {
-        dequantize_row_q_cuda = dequantize_row_q4_3_cuda;
-    }
     else {
         GGML_ASSERT(false);
     }
Loading…
Reference in New Issue
Block a user