Mirror of https://github.com/ggerganov/llama.cpp.git (synced 2024-12-30 21:34:36 +00:00)
kompute : remove Q6_K from list of supported quant types
kompute : remove Q6_K from list of supported quant types
This commit is contained in:
parent commit: 24a4a5956a
this commit:  3d850db767
@@ -6498,8 +6498,7 @@ struct llama_context * llama_new_context_with_model(
         && (model->ftype == LLAMA_FTYPE_ALL_F32
             || model->ftype == LLAMA_FTYPE_MOSTLY_F16
             || model->ftype == LLAMA_FTYPE_MOSTLY_Q4_0
-            || model->ftype == LLAMA_FTYPE_MOSTLY_Q4_1
-            || model->ftype == LLAMA_FTYPE_MOSTLY_Q6_K)) {
+            || model->ftype == LLAMA_FTYPE_MOSTLY_Q4_1)) {
         // this allocates all Vulkan resources and memory buffers
         ctx->ctx_kompute = ggml_vk_init();
Loading…
Reference in New Issue
Block a user