mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-25 10:54:36 +00:00
parent
a75fa576ab
commit
df9d1293de
@ -4209,7 +4209,7 @@ struct llm_build_context {
|
|||||||
struct ggml_tensor * Kcur = ggml_concat(ctx0, krotated, kpass);
|
struct ggml_tensor * Kcur = ggml_concat(ctx0, krotated, kpass);
|
||||||
cb(Kcur, "Kcur", il);
|
cb(Kcur, "Kcur", il);
|
||||||
|
|
||||||
struct ggml_tensor * Q = ggml_cont(ctx0, ggml_permute(ctx0, Qcur, 1, 2, 0, 3));
|
struct ggml_tensor * Q = ggml_cont(ctx0, ggml_permute(ctx0, Qcur, 2, 1, 0, 3));
|
||||||
cb(Q, "Q", il);
|
cb(Q, "Q", il);
|
||||||
|
|
||||||
Kcur = ggml_cont(ctx0, ggml_permute(ctx0, Kcur, 2, 1, 0, 3));
|
Kcur = ggml_cont(ctx0, ggml_permute(ctx0, Kcur, 2, 1, 0, 3));
|
||||||
|
Loading…
Reference in New Issue
Block a user