metal : fix wrong number of tokens per sequence in SSM_SCAN

2025-07-12 14:14:22 +00:00 · 2024-10-02 21:35:50 -04:00
parent 5b8ec2b978
commit 62b09b343c
1 changed file with 1 addition and 1 deletion
--- a/ggml/src/ggml-metal.m
+++ b/ggml/src/ggml-metal.m
@@ -1690,7 +1690,7 @@ static void ggml_metal_encode_node(
                const int64_t d_inner      = ne01;
                const int64_t n_head       = ne02;
                const int64_t n_group      = ne41;
-                const int64_t n_seq_tokens = ne11;
+                const int64_t n_seq_tokens = ne12;
                const int64_t n_seqs       = ne13;

                id<MTLComputePipelineState> pipeline = nil;