From 156263e0e79f8bff8fc2dffb4289330b2b014536 Mon Sep 17 00:00:00 2001 From: Roger Wang Date: Sat, 27 Sep 2025 18:17:59 -0700 Subject: [PATCH 1/2] fix Signed-off-by: Roger Wang --- vllm/model_executor/models/qwen3_moe.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/vllm/model_executor/models/qwen3_moe.py b/vllm/model_executor/models/qwen3_moe.py index 45b9c656a4bb..ba076e2203fe 100644 --- a/vllm/model_executor/models/qwen3_moe.py +++ b/vllm/model_executor/models/qwen3_moe.py @@ -107,7 +107,7 @@ def __init__( ): super().__init__() - config = vllm_config.model_config.hf_config + config = vllm_config.model_config.hf_config.get_text_config() parallel_config = vllm_config.parallel_config quant_config = vllm_config.quant_config @@ -293,7 +293,7 @@ class Qwen3MoeDecoderLayer(nn.Module): def __init__(self, vllm_config: VllmConfig, prefix: str = "") -> None: super().__init__() - config = vllm_config.model_config.hf_config + config = vllm_config.model_config.hf_config.get_text_config() cache_config = vllm_config.cache_config quant_config = vllm_config.quant_config @@ -586,7 +586,7 @@ class Qwen3MoeForCausalLM(nn.Module, SupportsPP, SupportsLoRA, def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""): super().__init__() - config = vllm_config.model_config.hf_config + config = vllm_config.model_config.hf_config.get_text_config() quant_config = vllm_config.quant_config self.config = config self.quant_config = quant_config From a718628fdeed31e1ec42367be1f88fb407bb4dc8 Mon Sep 17 00:00:00 2001 From: Roger Wang Date: Sat, 27 Sep 2025 18:33:57 -0700 Subject: [PATCH 2/2] update Signed-off-by: Roger Wang --- vllm/model_executor/models/qwen3_moe.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/vllm/model_executor/models/qwen3_moe.py b/vllm/model_executor/models/qwen3_moe.py index ba076e2203fe..61f1abad72b6 100644 --- a/vllm/model_executor/models/qwen3_moe.py +++ b/vllm/model_executor/models/qwen3_moe.py @@ -107,7 +107,7 @@ def __init__( ): super().__init__() - config = vllm_config.model_config.hf_config.get_text_config() + config = vllm_config.model_config.hf_text_config parallel_config = vllm_config.parallel_config quant_config = vllm_config.quant_config @@ -293,7 +293,7 @@ class Qwen3MoeDecoderLayer(nn.Module): def __init__(self, vllm_config: VllmConfig, prefix: str = "") -> None: super().__init__() - config = vllm_config.model_config.hf_config.get_text_config() + config = vllm_config.model_config.hf_text_config cache_config = vllm_config.cache_config quant_config = vllm_config.quant_config @@ -372,7 +372,7 @@ class Qwen3MoeModel(nn.Module): def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""): super().__init__() - config = vllm_config.model_config.hf_config.get_text_config() + config = vllm_config.model_config.hf_text_config quant_config = vllm_config.quant_config parallel_config = vllm_config.parallel_config eplb_config = parallel_config.eplb_config @@ -586,7 +586,7 @@ class Qwen3MoeForCausalLM(nn.Module, SupportsPP, SupportsLoRA, def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""): super().__init__() - config = vllm_config.model_config.hf_config.get_text_config() + config = vllm_config.model_config.hf_text_config quant_config = vllm_config.quant_config self.config = config self.quant_config = quant_config