model : Qwen3-Next-80B-A3B has 48 layers (#17898)

* model : Qwen3-Next-80B-A3B has 48 layers

* model : Add 80B-A3B type name
This commit is contained in:
Eric Zhang 2025-12-10 22:22:40 +08:00 committed by GitHub
parent 2d2e1030e3
commit b677721819
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
1 changed file with 2 additions and 1 deletion

View File

@@ -120,6 +120,7 @@ const char * llm_type_name(llm_type type) {
case LLM_TYPE_16B_A1B: return "16B.A1B"; case LLM_TYPE_16B_A1B: return "16B.A1B";
case LLM_TYPE_21B_A3B: return "21B.A3B"; case LLM_TYPE_21B_A3B: return "21B.A3B";
case LLM_TYPE_30B_A3B: return "30B.A3B"; case LLM_TYPE_30B_A3B: return "30B.A3B";
case LLM_TYPE_80B_A3B: return "80B.A3B";
case LLM_TYPE_100B_A6B: return "100B.A6B"; case LLM_TYPE_100B_A6B: return "100B.A6B";
case LLM_TYPE_106B_A12B: return "106B.A12B"; case LLM_TYPE_106B_A12B: return "106B.A12B";
case LLM_TYPE_230B_A10B: return "230B.A10B"; case LLM_TYPE_230B_A10B: return "230B.A10B";
@@ -2257,7 +2258,7 @@ void llama_model::load_hparams(llama_model_loader & ml) {
} }
switch (hparams.n_layer) { switch (hparams.n_layer) {
case 80: type = LLM_TYPE_80B_A3B; break; case 48: type = LLM_TYPE_80B_A3B; break;
default: type = LLM_TYPE_UNKNOWN; default: type = LLM_TYPE_UNKNOWN;
} }
} break; } break;