graph : remove redundant scale_w parameter (#20235)

This commit is contained in:
Sigbjørn Skjæret 2026-03-08 18:58:28 +01:00 committed by GitHub
parent 451ef08432
commit 35bee031e1
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
41 changed files with 85 additions and 86 deletions

View file

@@ -1,6 +1,5 @@
#include "models.h"
llm_build_dbrx::llm_build_dbrx(const llama_model & model, const llm_graph_params & params) : llm_graph_context(params) {
const int64_t n_embd_head = hparams.n_embd_head_v;
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
@@ -89,7 +88,7 @@ llm_build_dbrx::llm_build_dbrx(const llama_model & model, const llm_graph_params
nullptr,
n_expert, n_expert_used,
LLM_FFN_SILU, true,
-false, 0.0,
+hparams.expert_weights_scale,
LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX,
il);
cb(cur, "ffn_moe_out", il);