We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 76e88c9 · commit 5da3811 · Copy full SHA for 5da3811
src/llama-model.cpp
@@ -1429,7 +1429,10 @@ void llama_model::load_hparams(llama_model_loader & ml) {
1429
ml.get_key(LLM_KV_FIRST_K_DENSE_REPLACE, hparams.first_k_dense_replace, 0);
1430
1431
// Expert gating function (GLM45 uses sigmoid)
1432
- ml.get_key(LLM_KV_EXPERT_GATING_FUNC, hparams.expert_gating_func, uint32_t(LLAMA_EXPERT_GATING_FUNC_TYPE_SIGMOID));
+ ml.get_key(LLM_KV_EXPERT_GATING_FUNC, hparams.expert_gating_func, false);
1433
+ if (hparams.expert_gating_func == LLAMA_EXPERT_GATING_FUNC_TYPE_NONE) {
1434
+ hparams.expert_gating_func = LLAMA_EXPERT_GATING_FUNC_TYPE_SIGMOID;
1435
+ }
1436
1437
switch (hparams.n_layer) {
1438
case 46: type = LLM_TYPE_12B; break; // GLM-4.5-Air
0 commit comments