@@ -42,7 +42,7 @@ ggml_tensor * llm_build_mamba_base::build_mamba_layer(llm_graph_input_rs * inp,
4242 cur = ggml_reshape_3d (ctx0, cur, cur->ne [0 ], n_seq_tokens, n_seqs);
4343
4444 // {n_embd, 2*d_inner} @ {n_embd, n_seq_tokens, n_seqs} => {2*d_inner, n_seq_tokens, n_seqs}
45- ggml_tensor * xz = build_lora_mm (layer.ssm_in , cur);
45+ ggml_tensor * xz = build_lora_mm (layer.ssm_in , cur, layer. ssm_in_s );
4646 // split the above in two
4747 // => {d_inner, n_seq_tokens, n_seqs}
4848 ggml_tensor * x = ggml_view_3d (ctx0, xz, d_inner, xz->ne [1 ], xz->ne [2 ], xz->nb [1 ], xz->nb [2 ], 0 );
@@ -137,7 +137,7 @@ ggml_tensor * llm_build_mamba_base::build_mamba_layer(llm_graph_input_rs * inp,
137137 y = ggml_swiglu_split (ctx0, ggml_cont (ctx0, z), y);
138138
139139 // {d_inner, n_embd} @ {d_inner, n_seq_tokens, n_seqs} => {n_embd, n_seq_tokens, n_seqs}
140- cur = build_lora_mm (layer.ssm_out , y);
140+ cur = build_lora_mm (layer.ssm_out , y, layer. ssm_out_s );
141141 }
142142
143143 // {n_embd, n_seq_tokens, n_seqs} => {n_embd, n_tokens}
@@ -184,7 +184,7 @@ ggml_tensor * llm_build_mamba_base::build_mamba2_layer(llm_graph_input_rs * inp,
184184 // d_in_proj = 2 * self.d_inner + 2 * self.ngroups * self.d_state + self.nheads
185185
186186 // {n_embd, d_in_proj} @ {n_embd, n_seq_tokens, n_seqs} => {d_in_proj, n_seq_tokens, n_seqs}
187- ggml_tensor * zxBCdt = build_lora_mm (model.layers [il].ssm_in , cur);
187+ ggml_tensor * zxBCdt = build_lora_mm (model.layers [il].ssm_in , cur, model. layers [il]. ssm_in_s );
188188
189189 // split the above in three
190190 ggml_tensor * z = ggml_view_4d (ctx0, zxBCdt, head_dim, n_head, n_seq_tokens, n_seqs, head_dim * zxBCdt->nb [0 ],
@@ -278,7 +278,7 @@ ggml_tensor * llm_build_mamba_base::build_mamba2_layer(llm_graph_input_rs * inp,
278278 y = ggml_reshape_3d (ctx0, y, d_inner, n_seq_tokens, n_seqs);
279279
280280 // {d_inner, n_embd} @ {d_inner, n_seq_tokens, n_seqs} => {n_embd, n_seq_tokens, n_seqs}
281- cur = build_lora_mm (model.layers [il].ssm_out , y);
281+ cur = build_lora_mm (model.layers [il].ssm_out , y, model. layers [il]. ssm_out_s );
282282 }
283283
284284 // {n_embd, n_seq_tokens, n_seqs} => {n_embd, n_tokens}
0 commit comments