fix: divide 0 exception in mamba (#7932)

Signed-off-by: thxCode <thxcode0824@gmail.com>
2024-12-26 03:14:35 +00:00 · 2024-06-17 22:11:08 +08:00 · 2024-06-17 22:11:08 +08:00 · c637fcd34d
commit c637fcd34d
parent 6a2f0b3474
1 changed files with 1 additions and 1 deletions
--- a/llama.cpp
+++ b/llama.cpp
@ -5383,7 +5383,7 @@ static bool llm_load_tensors(
    // create tensors for the weights
    {
        const int64_t n_embd       = hparams.n_embd;
-        const int64_t n_embd_head  = n_embd / hparams.n_head;
+        const int64_t n_embd_head  = (hparams.n_head == 0) ? 0 : n_embd / hparams.n_head;
        const int64_t n_embd_k_gqa = hparams.n_embd_k_gqa();
        const int64_t n_embd_v_gqa = hparams.n_embd_v_gqa();
        const int64_t n_embd_gqa   = n_embd_v_gqa;