From fdd8acf01f59e78f013508bc0bf22c48477e38bf Mon Sep 17 00:00:00 2001 From: zRzRzRzRzRzRzR <2448370773@qq.com> Date: Sun, 28 Sep 2025 18:08:21 +0800 Subject: [PATCH] update glm-4.5 doc Signed-off-by: zRzRzRzRzRzRzR <2448370773@qq.com> --- docs/features/tool_calling.md | 6 ++++-- docs/models/supported_models.md | 2 +- tests/models/registry.py | 2 +- vllm/model_executor/models/glm4_moe.py | 2 +- 4 files changed, 7 insertions(+), 5 deletions(-) diff --git a/docs/features/tool_calling.md b/docs/features/tool_calling.md index 16693db7255c..241438ae5578 100644 --- a/docs/features/tool_calling.md +++ b/docs/features/tool_calling.md @@ -323,8 +323,10 @@ Flags: `--tool-call-parser longcat` Supported models: -* `ZhipuAI/GLM-4.5` -* `ZhipuAI/GLM-4.5-Air` +* `zai-org/GLM-4.5` +* `zai-org/GLM-4.5-Air` +* `zai-org/GLM-4.6` +* `zai-org/GLM-4.6-Air` Flags: `--tool-call-parser glm45` diff --git a/docs/models/supported_models.md b/docs/models/supported_models.md index 650f62492282..3ee5a7d0ffc5 100644 --- a/docs/models/supported_models.md +++ b/docs/models/supported_models.md @@ -367,7 +367,7 @@ th { | `Gemma3nForCausalLM` | Gemma 3n | `google/gemma-3n-E2B-it`, `google/gemma-3n-E4B-it`, etc. | | | ✅︎ | | `GlmForCausalLM` | GLM-4 | `zai-org/glm-4-9b-chat-hf`, etc. | ✅︎ | ✅︎ | ✅︎ | | `Glm4ForCausalLM` | GLM-4-0414 | `zai-org/GLM-4-32B-0414`, etc. | ✅︎ | ✅︎ | ✅︎ | -| `Glm4MoeForCausalLM` | GLM-4.5 | `zai-org/GLM-4.5`, etc. | ✅︎ | ✅︎ | ✅︎ | +| `Glm4MoeForCausalLM` | GLM-4.5, GLM-4.6 | `zai-org/GLM-4.5`, etc. | ✅︎ | ✅︎ | ✅︎ | | `GPT2LMHeadModel` | GPT-2 | `gpt2`, `gpt2-xl`, etc. | | ✅︎ | ✅︎ | | `GPTBigCodeForCausalLM` | StarCoder, SantaCoder, WizardCoder | `bigcode/starcoder`, `bigcode/gpt_bigcode-santacoder`, `WizardLM/WizardCoder-15B-V1.0`, etc. | ✅︎ | ✅︎ | ✅︎ | | `GPTJForCausalLM` | GPT-J | `EleutherAI/gpt-j-6b`, `nomic-ai/gpt4all-j`, etc. | | ✅︎ | ✅︎ | diff --git a/tests/models/registry.py b/tests/models/registry.py index e321acc873c6..124a97ed0c89 100644 --- a/tests/models/registry.py +++ b/tests/models/registry.py @@ -642,7 +642,7 @@ def check_available_online( speculative_model="baidu/ERNIE-4.5-21B-A3B-PT"), "Glm4MoeMTPModel": _HfExamplesInfo("zai-org/GLM-4.5", speculative_model="zai-org/GLM-4.5", - min_transformers_version="4.54", + min_transformers_version="4.56", is_available_online=False), "LongCatFlashMTPModel": _HfExamplesInfo( "meituan-longcat/LongCat-Flash-Chat", diff --git a/vllm/model_executor/models/glm4_moe.py b/vllm/model_executor/models/glm4_moe.py index 947c6ce62f55..2557748b7faa 100644 --- a/vllm/model_executor/models/glm4_moe.py +++ b/vllm/model_executor/models/glm4_moe.py @@ -21,7 +21,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only GLM-4.5 model compatible with HuggingFace weights.""" +"""Inference-only GLM-4.5, GLM-4.6 model compatible with HuggingFace weights.""" import typing from collections.abc import Callable, Iterable from itertools import islice