Преглед изворног кода

model : Qwen3-Next-80B-A3B has 48 layers (#17898)

* model : Qwen3-Next-80B-A3B has 48 layers

* model : Add 80B-A3B type name
Eric Zhang пре 1 месец
родитељ
комит
b677721819
1 измењен фајл: 2 додавања и 1 уклањање
  1. src/llama-model.cpp (+2 −1)

+ 2 - 1
src/llama-model.cpp

@@ -120,6 +120,7 @@ const char * llm_type_name(llm_type type) {
         case LLM_TYPE_16B_A1B:       return "16B.A1B";
         case LLM_TYPE_21B_A3B:       return "21B.A3B";
         case LLM_TYPE_30B_A3B:       return "30B.A3B";
+        case LLM_TYPE_80B_A3B:       return "80B.A3B";
         case LLM_TYPE_100B_A6B:      return "100B.A6B";
         case LLM_TYPE_106B_A12B:     return "106B.A12B";
         case LLM_TYPE_230B_A10B:     return "230B.A10B";
@@ -2257,7 +2258,7 @@ void llama_model::load_hparams(llama_model_loader & ml) {
                 }
 
                 switch (hparams.n_layer) {
-                    case 80: type = LLM_TYPE_80B_A3B; break;
+                    case 48: type = LLM_TYPE_80B_A3B; break;
                     default: type = LLM_TYPE_UNKNOWN;
                 }
             } break;