This commit is contained in:
Vaibhavs10 2025-07-04 14:15:34 +02:00
parent 6201b43814
commit 97c64a0974
1 changed file with 15 additions and 13 deletions

View File

@@ -13828,12 +13828,13 @@ struct llm_build_smollm3 : public llm_graph_context {
LLM_NORM_RMS, il); LLM_NORM_RMS, il);
cb(ffn_cur, "ffn_norm", il); cb(ffn_cur, "ffn_norm", il);
ffn_cur = build_ffn(ffn_cur, ffn_cur = build_ffn(
model.layers[il].ffn_up, NULL, NULL, ffn_cur,
model.layers[il].ffn_gate, NULL, NULL, model.layers[il].ffn_up, model.layers[il].ffn_up_b, nullptr,
model.layers[il].ffn_down, NULL, NULL, model.layers[il].ffn_gate, model.layers[il].ffn_gate_b, nullptr,
NULL, model.layers[il].ffn_down, model.layers[il].ffn_down_b, nullptr,
LLM_FFN_SILU, LLM_FFN_PAR, il); nullptr,
LLM_FFN_SILU, LLM_FFN_PAR, il);
cb(ffn_cur, "ffn_out", il); cb(ffn_cur, "ffn_out", il);
cur = ggml_add(ctx0, cur, ffn_cur); cur = ggml_add(ctx0, cur, ffn_cur);
@@ -13848,13 +13849,14 @@ struct llm_build_smollm3 : public llm_graph_context {
LLM_NORM_RMS, il); LLM_NORM_RMS, il);
cb(cur, "ffn_norm", il); cb(cur, "ffn_norm", il);
cur = build_ffn(cur, cur = build_ffn(
model.layers[il].ffn_up, NULL, NULL, cur,
model.layers[il].ffn_gate, NULL, NULL, model.layers[il].ffn_up, model.layers[il].ffn_up_b, nullptr,
model.layers[il].ffn_down, NULL, NULL, model.layers[il].ffn_gate, model.layers[il].ffn_gate_b, nullptr,
NULL, model.layers[il].ffn_down, model.layers[il].ffn_down_b, nullptr,
LLM_FFN_SILU, LLM_FFN_PAR, il); nullptr,
cb(cur, "ffn_out", il); LLM_FFN_SILU, LLM_FFN_PAR, il);
cb(cur, "ffn_out", il);
cur = ggml_add(ctx0, cur, ffn_inp); cur = ggml_add(ctx0, cur, ffn_inp);
cb(cur, "ffn_out", il); cb(cur, "ffn_out", il);