From 712fecba61b803fc324004220d7bb782240dcba6 Mon Sep 17 00:00:00 2001
From: ngxson
Date: Mon, 8 Jul 2024 16:48:55 +0200
Subject: [PATCH] no more transpose A

---
 src/llama.cpp | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/src/llama.cpp b/src/llama.cpp
index a4ceb0959..b42cc5fb4 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -7867,10 +7867,9 @@ static struct ggml_tensor * llm_build_lora_mm(
             continue;
         }
         // TODO: check if lora_a need transpose
-        struct ggml_tensor * a = ggml_cont(ctx0, ggml_transpose(ctx0, lora->a));
         struct ggml_tensor * ab_cur = ggml_mul_mat(
             ctx0, lora->b,
-            ggml_mul_mat(ctx0, a, cur)
+            ggml_mul_mat(ctx0, lora->a, cur)
         );
         ab_cur = ggml_scale_inplace(ctx0, ab_cur, scale);
         res = ggml_add(ctx0, res, ab_cur);