metal : fix wrong number of tokens per sequence in SSM_SCAN

2024-11-15 15:29:53 +00:00 · 2024-10-02 21:35:50 -04:00 · 2024-10-02 21:35:50 -04:00 · 62b09b343c
commit 62b09b343c
parent 5b8ec2b978
1 changed file with 1 addition and 1 deletion
--- a/ggml/src/ggml-metal.m
+++ b/ggml/src/ggml-metal.m
@@ -1690,7 +1690,7 @@ static void ggml_metal_encode_node(
                const int64_t d_inner      = ne01;
                const int64_t n_head       = ne02;
                const int64_t n_group      = ne41;
-                const int64_t n_seq_tokens = ne11;
+                const int64_t n_seq_tokens = ne12;
                const int64_t n_seqs       = ne13;
                id<MTLComputePipelineState> pipeline = nil;