mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-13 12:10:18 +00:00
no more transpose A
This commit is contained in:
parent
79e2982788
commit
712fecba61
@ -7867,10 +7867,9 @@ static struct ggml_tensor * llm_build_lora_mm(
|
|||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
// TODO: check if lora_a need transpose
|
// TODO: check if lora_a need transpose
|
||||||
struct ggml_tensor * a = ggml_cont(ctx0, ggml_transpose(ctx0, lora->a));
|
|
||||||
struct ggml_tensor * ab_cur = ggml_mul_mat(
|
struct ggml_tensor * ab_cur = ggml_mul_mat(
|
||||||
ctx0, lora->b,
|
ctx0, lora->b,
|
||||||
ggml_mul_mat(ctx0, a, cur)
|
ggml_mul_mat(ctx0, lora->a, cur)
|
||||||
);
|
);
|
||||||
ab_cur = ggml_scale_inplace(ctx0, ab_cur, scale);
|
ab_cur = ggml_scale_inplace(ctx0, ab_cur, scale);
|
||||||
res = ggml_add(ctx0, res, ab_cur);
|
res = ggml_add(ctx0, res, ab_cur);
|
||||||
|
Loading…
Reference in New Issue
Block a user