Mirror of https://github.com/ggerganov/llama.cpp.git (synced 2024-11-15 15:29:53 +00:00)
metal : fix wrong number of tokens per sequence in SSM_SCAN
Some checks failed:
flake8 Lint / Lint (push) has been cancelled.
This commit is contained in:
parent 5b8ec2b978
commit 62b09b343c
@@ -1690,7 +1690,7 @@ static void ggml_metal_encode_node(
|
|||||||
const int64_t d_inner = ne01;
|
const int64_t d_inner = ne01;
|
||||||
const int64_t n_head = ne02;
|
const int64_t n_head = ne02;
|
||||||
const int64_t n_group = ne41;
|
const int64_t n_group = ne41;
|
||||||
const int64_t n_seq_tokens = ne11;
|
const int64_t n_seq_tokens = ne12;
|
||||||
const int64_t n_seqs = ne13;
|
const int64_t n_seqs = ne13;
|
||||||
|
|
||||||
id<MTLComputePipelineState> pipeline = nil;
|
id<MTLComputePipelineState> pipeline = nil;
|
||||||
|
Loading…
Reference in New Issue
Block a user