Skip to content

Commit 7503535

Browse files
authored
Merge pull request ggml-org#3 from DominguesM/nvidia-nemotron-nano-v2
Nemotron-H: MLP gate cleanup + honor ssm_dt_rank for dt_dim
2 parents 3132915 + 4223a1f commit 7503535

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

src/llama-model.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -14339,11 +14339,11 @@ struct llm_build_nemotronh : public llm_graph_context_mamba {
14339 14339

14340 14340
cur = build_ffn(cur,
14341 14341
model.layers[il].ffn_up, model.layers[il].ffn_up_b, NULL,
14342-
model.layers[il].ffn_gate, model.layers[il].ffn_gate_b, NULL,
14342+
NULL, NULL, NULL,
14343 14343
model.layers[il].ffn_down, model.layers[il].ffn_down_b, NULL,
14344 14344
NULL,
14345 14345
LLM_FFN_RELU_SQR, LLM_FFN_PAR, il);
14346-
cb(cur, "ffn_out", il);
14346+
cb(cur, "ffn_out", il);
14347 14347

14348 14348
cur = build_cvec(cur, il);
14349 14349
cb(cur, "l_out", il);

0 commit comments

Comments
 (0)