common : disable KV cache shifting automatically for unsupported models (#11053)

* Disable KV cache shifting automatically for unsupported models instead of exiting directly

  Signed-off-by: Molly Sophia <mollysophia379@gmail.com>

* Update common/common.cpp

  Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>

---------

Signed-off-by: Molly Sophia <mollysophia379@gmail.com>
Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
2025-01-12 03:31:46 +00:00 · 2025-01-03 20:13:18 +08:00 · 2025-01-03 20:13:18 +08:00 · 4b0c638b9a
commit 4b0c638b9a
parent e7da954ecc
1 changed files with 2 additions and 3 deletions
--- a/common/common.cpp
+++ b/common/common.cpp
@@ -889,9 +889,8 @@ struct common_init_result common_init_from_params(common_params & params) {
    }

    if (params.ctx_shift && !llama_kv_cache_can_shift(lctx)) {
-        LOG_ERR("%s: KV cache shifting is not supported for this model (--no-context-shift to disable)'\n", __func__);
-        llama_free_model(model);
-        return iparams;
+        LOG_WRN("%s: KV cache shifting is not supported for this model, disabling KV cache shifting\n", __func__);
+        params.ctx_shift = false;
    }

    if (!params.control_vectors.empty()) {