llama : use unused n_embd_k_gqa in k_shift

This also slightly reduces the diff from the master branch
2025-01-12 11:40:17 +00:00 · 2024-09-01 21:59:24 -04:00 · 2024-09-01 21:59:24 -04:00 · 375de5b1f8
commit 375de5b1f8
parent 5f62db790b
1 changed file with 1 addition and 1 deletion
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -10806,7 +10806,7 @@ struct llm_build_context {
                        ggml_view_3d(ctx0, kv_self.k_l[il],
                            n_embd_head_k, n_head_kv, n_ctx,
                            ggml_row_size(kv_self.k_l[il]->type, n_embd_head_k),
-                            ggml_row_size(kv_self.k_l[il]->type, hparams.n_embd_k_gqa(il)),
+                            ggml_row_size(kv_self.k_l[il]->type, n_embd_k_gqa),
                            0),
                        lctx.inp_K_shift, rope_factors, n_rot, rope_type, n_ctx_orig, freq_base, freq_scale,
                        ext_factor, attn_factor, beta_fast, beta_slow);