llama : fix buffer checks for mamba and rwkv (llama/10111)

* llama : fix buffer checks for mamba and rwkv
* llama : fix missing worst case flag during reserve
* cuda : fix supports_op for norm
* disable sched SET_CAUSE
2025-06-16 13:58:09 +00:00 · 2024-10-31 22:54:23 +01:00
parent 371bfaca8c
commit 3e231ab9cc
3 changed files with 6 additions and 3 deletions
--- a/ggml/src/ggml.c
+++ b/ggml/src/ggml.c
@@ -7243,6 +7243,7 @@ struct ggml_tensor * ggml_ssm_conv(
    const int64_t n_s     = sx->ne[2];

    // TODO: maybe support other strides than 1?
+    // FIXME: this is always true?
    GGML_ASSERT(sx->ne[0] == d_conv - 1 + n_t);
    GGML_ASSERT(sx->ne[1] == d_inner);
    GGML_ASSERT(n_t >= 0);