mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-13 12:10:18 +00:00
llama : add ggml_cont to trigger bug with Metal
This commit is contained in:
parent
bd33e5ab92
commit
ad80e5a4a7
@ -2418,11 +2418,11 @@ static struct ggml_cgraph * llm_build_llama(
|
|||||||
|
|
||||||
// split cached V into n_head heads
|
// split cached V into n_head heads
|
||||||
struct ggml_tensor * V =
|
struct ggml_tensor * V =
|
||||||
ggml_view_3d(ctx0, kv_self.v,
|
ggml_cont(ctx0, ggml_view_3d(ctx0, kv_self.v,
|
||||||
n_past + N, n_embd_head, n_head_kv,
|
n_past + N, n_embd_head, n_head_kv,
|
||||||
ggml_element_size(kv_self.v)*n_ctx,
|
ggml_element_size(kv_self.v)*n_ctx,
|
||||||
ggml_element_size(kv_self.v)*n_ctx*n_embd_head,
|
ggml_element_size(kv_self.v)*n_ctx*n_embd_head,
|
||||||
ggml_element_size(kv_self.v)*n_ctx*n_embd_gqa*il);
|
ggml_element_size(kv_self.v)*n_ctx*n_embd_gqa*il));
|
||||||
offload_func_v(V);
|
offload_func_v(V);
|
||||||
ggml_set_name(V, "V");
|
ggml_set_name(V, "V");
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user