modelscope · Jintao-Huang · Sep 16, 2025 · Sep 16, 2025 · Sep 16, 2025 · Sep 16, 2025
diff --git a/README.md b/README.md
@@ -124,18 +124,18 @@ Running Environment:
 
 |              | Range        | Recommended         | Notes                                     |
 |--------------|--------------|---------------------|-------------------------------------------|
-| python       | >=3.9        | 3.10                |                                           |
+| python       | >=3.9        | 3.10/3.11                |                                           |
 | cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
 | torch        | >=2.0        | 2.7.1               |                                           |
-| transformers | >=4.33       | 4.55.4              |                                           |
+| transformers | >=4.33       | 4.56.1              |                                           |
 | modelscope   | >=1.23       |                     |                                           |
 | peft         | >=0.11,<0.18 |                     |                                           |
 | flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
 | trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
-| deepspeed    | >=0.14       | 0.16.9              | Training                                  |
-| vllm         | >=0.5.1      | 0.10                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.9.post6         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2                 | Inference/Deployment                      |
+| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
+| vllm         | >=0.5.1      | 0.10.1.1                | Inference/Deployment                      |
+| sglang       | >=0.4.6      | 0.4.10.post2         | Inference/Deployment                      |
+| lmdeploy     | >=0.5   | 0.9.2.post1                 | Inference/Deployment                      |
-| python       | >=3.9        | 3.10/3.11                |                                           |
-| cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
-| torch        | >=2.0        | 2.7.1               |                                           |
-| transformers | >=4.33       | 4.55.4              |                                           |
-| transformers | >=4.33       | 4.56.1              |                                           |
-| modelscope   | >=1.23       |                     |                                           |
-| peft         | >=0.11,<0.18 |                     |                                           |
-| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
-| trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
-| deepspeed    | >=0.14       | 0.16.9              | Training                                  |
-| vllm         | >=0.5.1      | 0.10                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.9.post6         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2                 | Inference/Deployment                      |
-| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
-| vllm         | >=0.5.1      | 0.10.1.1                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.10.post2         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2.post1                 | Inference/Deployment                      |
+| python       | >=3.9        | 3.10/3.11           |                                           |
+| cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
+| torch        | >=2.0        | 2.7.1               |                                           |
+| transformers | >=4.33       | 4.56.1              |                                           |
+| modelscope   | >=1.23       |                     |                                           |
+| peft         | >=0.11,<0.18 |                     |                                           |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
+| trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
+| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
+| vllm         | >=0.5.1      | 0.10.1.1            | Inference/Deployment                      |
+| sglang       | >=0.4.6      | 0.4.10.post2        | Inference/Deployment                      |
+| lmdeploy     | >=0.5        | 0.9.2.post1         | Inference/Deployment                      |
-| python       | >=3.9        | 3.10/3.11                |                                           |
-| cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
-| torch        | >=2.0        | 2.7.1               |                                           |
-| transformers | >=4.33       | 4.55.4              |                                           |
-| transformers | >=4.33       | 4.56.1              |                                           |
-| modelscope   | >=1.23       |                     |                                           |
-| peft         | >=0.11,<0.18 |                     |                                           |
-| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
-| trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
-| deepspeed    | >=0.14       | 0.16.9              | Training                                  |
-| vllm         | >=0.5.1      | 0.10                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.9.post6         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2                 | Inference/Deployment                      |
-| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
-| vllm         | >=0.5.1      | 0.10.1.1                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.10.post2         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2.post1                 | Inference/Deployment                      |
+| python       | >=3.9        | 3.10/3.11           |                                           |
+| cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
+| torch        | >=2.0        | 2.7.1               |                                           |
+| transformers | >=4.33       | 4.56.1              |                                           |
+| modelscope   | >=1.23       |                     |                                           |
+| peft         | >=0.11,<0.18 |                     |                                           |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
+| trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
+| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
+| vllm         | >=0.5.1      | 0.10.1.1            | Inference/Deployment                      |
+| sglang       | >=0.4.6      | 0.4.10.post2        | Inference/Deployment                      |
+| lmdeploy     | >=0.5        | 0.9.2.post1         | Inference/Deployment                      |
 | evalscope    | >=0.11       |                     | Evaluation                                |
 | gradio       |              | 5.32.1              | Web-UI/App                                |
 

diff --git a/README_CN.md b/README_CN.md
@@ -120,18 +120,18 @@ pip install -e .
 
 |              | 范围           | 推荐                  | 备注                 |
 |--------------|--------------|---------------------|--------------------|
-| python       | >=3.9        | 3.10                |                    |
+| python       | >=3.9        | 3.10/3.11            |                    |
 | cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
 | torch        | >=2.0        | 2.7.1               |                    |
-| transformers | >=4.33       | 4.55.4              |                    |
+| transformers | >=4.33       | 4.56.1              |                    |
 | modelscope   | >=1.23       |                     |                    |
 | peft         | >=0.11,<0.18 |                     |                    |
 | flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
 | trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
-| deepspeed    | >=0.14       | 0.16.9              | 训练                 |
-| vllm         | >=0.5.1      | 0.10                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.9.post6         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2                 | 推理/部署              |
+| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
+| vllm         | >=0.5.1      | 0.10.1.1                | 推理/部署              |
+| sglang       | >=0.4.6      | 0.4.10.post2         | 推理/部署              |
+| lmdeploy     | >=0.5   | 0.9.2.post1                 | 推理/部署              |
-| python       | >=3.9        | 3.10/3.11            |                    |
-| cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
-| torch        | >=2.0        | 2.7.1               |                    |
-| transformers | >=4.33       | 4.55.4              |                    |
-| transformers | >=4.33       | 4.56.1              |                    |
-| modelscope   | >=1.23       |                     |                    |
-| peft         | >=0.11,<0.18 |                     |                    |
-| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
-| trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
-| deepspeed    | >=0.14       | 0.16.9              | 训练                 |
-| vllm         | >=0.5.1      | 0.10                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.9.post6         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2                 | 推理/部署              |
-| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
-| vllm         | >=0.5.1      | 0.10.1.1                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.10.post2         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2.post1                 | 推理/部署              |
+| python       | >=3.9        | 3.10/3.11           |                    |
+| cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
+| torch        | >=2.0        | 2.7.1               |                    |
+| transformers | >=4.33       | 4.56.1              |                    |
+| modelscope   | >=1.23       |                     |                    |
+| peft         | >=0.11,<0.18 |                     |                    |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
+| trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
+| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
+| vllm         | >=0.5.1      | 0.10.1.1            | 推理/部署              |
+| sglang       | >=0.4.6      | 0.4.10.post2        | 推理/部署              |
+| lmdeploy     | >=0.5        | 0.9.2.post1         | 推理/部署              |
-| python       | >=3.9        | 3.10/3.11            |                    |
-| cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
-| torch        | >=2.0        | 2.7.1               |                    |
-| transformers | >=4.33       | 4.55.4              |                    |
-| transformers | >=4.33       | 4.56.1              |                    |
-| modelscope   | >=1.23       |                     |                    |
-| peft         | >=0.11,<0.18 |                     |                    |
-| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
-| trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
-| deepspeed    | >=0.14       | 0.16.9              | 训练                 |
-| vllm         | >=0.5.1      | 0.10                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.9.post6         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2                 | 推理/部署              |
-| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
-| vllm         | >=0.5.1      | 0.10.1.1                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.10.post2         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2.post1                 | 推理/部署              |
+| python       | >=3.9        | 3.10/3.11           |                    |
+| cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
+| torch        | >=2.0        | 2.7.1               |                    |
+| transformers | >=4.33       | 4.56.1              |                    |
+| modelscope   | >=1.23       |                     |                    |
+| peft         | >=0.11,<0.18 |                     |                    |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
+| trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
+| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
+| vllm         | >=0.5.1      | 0.10.1.1            | 推理/部署              |
+| sglang       | >=0.4.6      | 0.4.10.post2        | 推理/部署              |
+| lmdeploy     | >=0.5        | 0.9.2.post1         | 推理/部署              |
 | evalscope    | >=0.11       |                     | 评测                 |
 | gradio       |              | 5.32.1              | Web-UI/App         |
 

diff --git a/docs/source/GetStarted/SWIFT安装.md b/docs/source/GetStarted/SWIFT安装.md
@@ -91,18 +91,18 @@ modelscope-registry.us-west-1.cr.aliyuncs.com/modelscope-repo/modelscope:ubuntu2
 
 |              | 范围           | 推荐                  | 备注                 |
 |--------------|--------------|---------------------|--------------------|
-| python       | >=3.9        | 3.10                |                    |
+| python       | >=3.9        | 3.10/3.11                |                    |
 | cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
 | torch        | >=2.0        | 2.7.1               |                    |
-| transformers | >=4.33       | 4.55.4              |                    |
+| transformers | >=4.33       | 4.56.1              |                    |
 | modelscope   | >=1.23       |                     |                    |
 | peft         | >=0.11,<0.18 |                     |                    |
 | flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
 | trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
-| deepspeed    | >=0.14       | 0.16.9              | 训练                 |
-| vllm         | >=0.5.1      | 0.10                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.9.post6         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2                 | 推理/部署              |
+| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
+| vllm         | >=0.5.1      | 0.10.1.1                | 推理/部署              |
+| sglang       | >=0.4.6      | 0.4.10.post2         | 推理/部署              |
+| lmdeploy     | >=0.5   | 0.9.2.post1                 | 推理/部署              |
-| python       | >=3.9        | 3.10/3.11                |                    |
-| cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
-| torch        | >=2.0        | 2.7.1               |                    |
-| transformers | >=4.33       | 4.55.4              |                    |
-| transformers | >=4.33       | 4.56.1              |                    |
-| modelscope   | >=1.23       |                     |                    |
-| peft         | >=0.11,<0.18 |                     |                    |
-| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
-| trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
-| deepspeed    | >=0.14       | 0.16.9              | 训练                 |
-| vllm         | >=0.5.1      | 0.10                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.9.post6         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2                 | 推理/部署              |
-| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
-| vllm         | >=0.5.1      | 0.10.1.1                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.10.post2         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2.post1                 | 推理/部署              |
+| python       | >=3.9        | 3.10/3.11           |                    |
+| cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
+| torch        | >=2.0        | 2.7.1               |                    |
+| transformers | >=4.33       | 4.56.1              |                    |
+| modelscope   | >=1.23       |                     |                    |
+| peft         | >=0.11,<0.18 |                     |                    |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
+| trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
+| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
+| vllm         | >=0.5.1      | 0.10.1.1            | 推理/部署              |
+| sglang       | >=0.4.6      | 0.4.10.post2        | 推理/部署              |
+| lmdeploy     | >=0.5        | 0.9.2.post1         | 推理/部署              |
-| python       | >=3.9        | 3.10/3.11                |                    |
-| cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
-| torch        | >=2.0        | 2.7.1               |                    |
-| transformers | >=4.33       | 4.55.4              |                    |
-| transformers | >=4.33       | 4.56.1              |                    |
-| modelscope   | >=1.23       |                     |                    |
-| peft         | >=0.11,<0.18 |                     |                    |
-| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
-| trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
-| deepspeed    | >=0.14       | 0.16.9              | 训练                 |
-| vllm         | >=0.5.1      | 0.10                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.9.post6         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2                 | 推理/部署              |
-| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
-| vllm         | >=0.5.1      | 0.10.1.1                | 推理/部署              |
-| sglang       | >=0.4.6      | 0.4.10.post2         | 推理/部署              |
-| lmdeploy     | >=0.5   | 0.9.2.post1                 | 推理/部署              |
+| python       | >=3.9        | 3.10/3.11           |                    |
+| cuda         |              | cuda12              | 使用cpu、npu、mps则无需安装 |
+| torch        | >=2.0        | 2.7.1               |                    |
+| transformers | >=4.33       | 4.56.1              |                    |
+| modelscope   | >=1.23       |                     |                    |
+| peft         | >=0.11,<0.18 |                     |                    |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
+| trl          | >=0.15,<0.21 | 0.20.0              | RLHF               |
+| deepspeed    | >=0.14       | 0.17.5              | 训练                 |
+| vllm         | >=0.5.1      | 0.10.1.1            | 推理/部署              |
+| sglang       | >=0.4.6      | 0.4.10.post2        | 推理/部署              |
+| lmdeploy     | >=0.5        | 0.9.2.post1         | 推理/部署              |
 | evalscope    | >=0.11       |                     | 评测                 |
 | gradio       |              | 5.32.1              | Web-UI/App         |
 

diff --git a/docs/source/Megatron-SWIFT/快速开始.md b/docs/source/Megatron-SWIFT/快速开始.md
@@ -45,14 +45,14 @@ modelscope-registry.us-west-1.cr.aliyuncs.com/modelscope-repo/modelscope:ubuntu2
 推荐运行环境：
 |              | 范围           | 推荐          | 备注                 |
 |--------------|--------------|-------------|--------------------|
-| python       | >=3.9        | 3.10        |                    |
+| python       | >=3.9        | 3.10/3.11        |                    |
 | cuda         |              | cuda12      |                    |
 | torch        | >=2.0        | 2.6.0/2.7.1       |                    |
 | transformer_engine    | >=2.3       |          |                  |
 | apex |   |  0.1 | |
 | megatron_core    | >=0.12       | 0.13      |                  |
 | flash_attn    |        | 2.7.4.post1/3.0.0b1   |                  |
-| transformers | >=4.33       | 4.51.3      |                    |
+| transformers | >=4.33       | 4.56.1      |                    |
-| python       | >=3.9        | 3.10/3.11        |                    |
-| cuda         |              | cuda12      |                    |
-| torch        | >=2.0        | 2.6.0/2.7.1       |                    |
-| transformer_engine    | >=2.3       |          |                  |
-| apex |   |  0.1 | |
-| megatron_core    | >=0.12       | 0.13      |                  |
-| flash_attn    |        | 2.7.4.post1/3.0.0b1   |                  |
-| transformers | >=4.33       | 4.51.3      |                    |
-| transformers | >=4.33       | 4.56.1      |                    |
+| python       | >=3.9        | 3.10/3.11   |                    |
+| cuda         |              | cuda12      |                    |
+| torch        | >=2.0        | 2.6.0/2.7.1 |                    |
+| transformer_engine    | >=2.3       |             |                  |
+| apex         |              | 0.1         |                    |
+| megatron_core    | >=0.12       | 0.13        |                  |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
+| transformers | >=4.33       | 4.56.1      |                    |
-| python       | >=3.9        | 3.10/3.11        |                    |
-| cuda         |              | cuda12      |                    |
-| torch        | >=2.0        | 2.6.0/2.7.1       |                    |
-| transformer_engine    | >=2.3       |          |                  |
-| apex |   |  0.1 | |
-| megatron_core    | >=0.12       | 0.13      |                  |
-| flash_attn    |        | 2.7.4.post1/3.0.0b1   |                  |
-| transformers | >=4.33       | 4.51.3      |                    |
-| transformers | >=4.33       | 4.56.1      |                    |
+| python       | >=3.9        | 3.10/3.11   |                    |
+| cuda         |              | cuda12      |                    |
+| torch        | >=2.0        | 2.6.0/2.7.1 |                    |
+| transformer_engine    | >=2.3       |             |                  |
+| apex         |              | 0.1         |                    |
+| megatron_core    | >=0.12       | 0.13        |                  |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                    |
+| transformers | >=4.33       | 4.56.1      |                    |
 | modelscope   | >=1.23       |             |                    |
 | peft         | >=0.11,<0.18 |             |      LoRA          |
 | trl          | >=0.15,<0.21 |       |      RLHF        |

diff --git a/docs/source_en/GetStarted/SWIFT-installation.md b/docs/source_en/GetStarted/SWIFT-installation.md
@@ -92,18 +92,18 @@ More images can be found [here](https://modelscope.cn/docs/intro/environment-set
 
 |              | Range        | Recommended         | Notes                                     |
 |--------------|--------------|---------------------|-------------------------------------------|
-| python       | >=3.9        | 3.10                |                                           |
+| python       | >=3.9        | 3.10/3.11                |                                           |
 | cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
 | torch        | >=2.0        | 2.7.1               |                                           |
-| transformers | >=4.33       | 4.55.4              |                                           |
+| transformers | >=4.33       | 4.56.1              |                                           |
 | modelscope   | >=1.23       |                     |                                           |
 | peft         | >=0.11,<0.18 |                     |                                           |
 | flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
 | trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
-| deepspeed    | >=0.14       | 0.16.9              | Training                                  |
-| vllm         | >=0.5.1      | 0.10                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.9.post6         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2                 | Inference/Deployment                      |
+| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
+| vllm         | >=0.5.1      | 0.10.1.1                | Inference/Deployment                      |
+| sglang       | >=0.4.6      | 0.4.10.post2         | Inference/Deployment                      |
+| lmdeploy     | >=0.5   | 0.9.2.post1                 | Inference/Deployment                      |
-| python       | >=3.9        | 3.10/3.11                |                                           |
-| cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
-| torch        | >=2.0        | 2.7.1               |                                           |
-| transformers | >=4.33       | 4.55.4              |                                           |
-| transformers | >=4.33       | 4.56.1              |                                           |
-| modelscope   | >=1.23       |                     |                                           |
-| peft         | >=0.11,<0.18 |                     |                                           |
-| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
-| trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
-| deepspeed    | >=0.14       | 0.16.9              | Training                                  |
-| vllm         | >=0.5.1      | 0.10                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.9.post6         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2                 | Inference/Deployment                      |
-| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
-| vllm         | >=0.5.1      | 0.10.1.1                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.10.post2         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2.post1                 | Inference/Deployment                      |
+| python       | >=3.9        | 3.10/3.11           |                                           |
+| cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
+| torch        | >=2.0        | 2.7.1               |                                           |
+| transformers | >=4.33       | 4.56.1              |                                           |
+| modelscope   | >=1.23       |                     |                                           |
+| peft         | >=0.11,<0.18 |                     |                                           |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
+| trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
+| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
+| vllm         | >=0.5.1      | 0.10.1.1            | Inference/Deployment                      |
+| sglang       | >=0.4.6      | 0.4.10.post2        | Inference/Deployment                      |
+| lmdeploy     | >=0.5        | 0.9.2.post1         | Inference/Deployment                      |
-| python       | >=3.9        | 3.10/3.11                |                                           |
-| cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
-| torch        | >=2.0        | 2.7.1               |                                           |
-| transformers | >=4.33       | 4.55.4              |                                           |
-| transformers | >=4.33       | 4.56.1              |                                           |
-| modelscope   | >=1.23       |                     |                                           |
-| peft         | >=0.11,<0.18 |                     |                                           |
-| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
-| trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
-| deepspeed    | >=0.14       | 0.16.9              | Training                                  |
-| vllm         | >=0.5.1      | 0.10                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.9.post6         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2                 | Inference/Deployment                      |
-| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
-| vllm         | >=0.5.1      | 0.10.1.1                | Inference/Deployment                      |
-| sglang       | >=0.4.6      | 0.4.10.post2         | Inference/Deployment                      |
-| lmdeploy     | >=0.5   | 0.9.2.post1                 | Inference/Deployment                      |
+| python       | >=3.9        | 3.10/3.11           |                                           |
+| cuda         |              | cuda12              | No need to install if using CPU, NPU, MPS |
+| torch        | >=2.0        | 2.7.1               |                                           |
+| transformers | >=4.33       | 4.56.1              |                                           |
+| modelscope   | >=1.23       |                     |                                           |
+| peft         | >=0.11,<0.18 |                     |                                           |
+| flash_attn   |              | 2.7.4.post1/3.0.0b1 |                                           |
+| trl          | >=0.15,<0.21 | 0.20.0              | RLHF                                      |
+| deepspeed    | >=0.14       | 0.17.5              | Training                                  |
+| vllm         | >=0.5.1      | 0.10.1.1            | Inference/Deployment                      |
+| sglang       | >=0.4.6      | 0.4.10.post2        | Inference/Deployment                      |
+| lmdeploy     | >=0.5        | 0.9.2.post1         | Inference/Deployment                      |
 | evalscope    | >=0.11       |                     | Evaluation                                |
 | gradio       |              | 5.32.1              | Web-UI/App                                |
 

diff --git a/docs/source_en/Megatron-SWIFT/Quick-start.md b/docs/source_en/Megatron-SWIFT/Quick-start.md
@@ -46,14 +46,14 @@ Recommended Operating Environment:
 
 |        | Range | Recommended | Notes |
 |--------------|--------------|-------------|--------------------|
-| python       | >=3.9        | 3.10        |                    |
+| python       | >=3.9        | 3.10/3.11        |                    |
 | cuda         |              | cuda12      |                    |
 | torch        | >=2.0        | 2.6.0/2.7.1    |                    |
 | transformer_engine    | >=2.3       |         |                  |
 | apex |   |  0.1 | |
 | megatron_core    | >=0.12       | 0.13      |                  |
 | flash_attn    |        | 2.7.4.post1/3.0.0b1   |                  |
-| transformers | >=4.33       | 4.51.3      |                    |
+| transformers | >=4.33       | 4.56.1      |                    |
-| python       | >=3.9        | 3.10/3.11        |                    |
-| cuda         |              | cuda12      |                    |
-| torch        | >=2.0        | 2.6.0/2.7.1    |                    |
-| transformer_engine    | >=2.3       |         |                  |
-| apex |   |  0.1 | |
-| megatron_core    | >=0.12       | 0.13      |                  |
-| flash_attn    |        | 2.7.4.post1/3.0.0b1   |                  |
-| transformers | >=4.33       | 4.51.3      |                    |
-| transformers | >=4.33       | 4.56.1      |                    |
+| python       | >=3.9        | 3.10/3.11   |                    |
+| cuda         |              | cuda12      |                    |
+| torch        | >=2.0        | 2.6.0/2.7.1 |                    |
+| transformer_engine    | >=2.3       |             |                  |
+| apex         |              | 0.1         |                    |
+| megatron_core    | >=0.12       | 0.13        |                  |
+| flash_attn    |              | 2.7.4.post1/3.0.0b1   |                  |
+| transformers | >=4.33       | 4.56.1      |                    |
-| python       | >=3.9        | 3.10/3.11        |                    |
-| cuda         |              | cuda12      |                    |
-| torch        | >=2.0        | 2.6.0/2.7.1    |                    |
-| transformer_engine    | >=2.3       |         |                  |
-| apex |   |  0.1 | |
-| megatron_core    | >=0.12       | 0.13      |                  |
-| flash_attn    |        | 2.7.4.post1/3.0.0b1   |                  |
-| transformers | >=4.33       | 4.51.3      |                    |
-| transformers | >=4.33       | 4.56.1      |                    |
+| python       | >=3.9        | 3.10/3.11   |                    |
+| cuda         |              | cuda12      |                    |
+| torch        | >=2.0        | 2.6.0/2.7.1 |                    |
+| transformer_engine    | >=2.3       |             |                  |
+| apex         |              | 0.1         |                    |
+| megatron_core    | >=0.12       | 0.13        |                  |
+| flash_attn    |              | 2.7.4.post1/3.0.0b1   |                  |
+| transformers | >=4.33       | 4.56.1      |                    |
 | modelscope   | >=1.23       |             |                    |
 | peft         | >=0.11,<0.18 |             |      LoRA          |
 | trl          | >=0.15,<0.21 |       |      RLHF        |

diff --git a/requirements/install_all.sh b/requirements/install_all.sh
@@ -1,13 +1,13 @@
 # please use python=3.10, cuda12.*
 # sh requirements/install_all.sh
 pip install "sglang[all]<0.5" -U
-pip install "vllm>=0.5.1" "transformers<4.56" "trl<0.21" -U
+pip install "vllm>=0.5.1,<0.10.2" "transformers<4.57" "trl<0.21" -U
 pip install "lmdeploy>=0.5" -U
 pip install autoawq -U --no-deps
 pip install auto_gptq optimum bitsandbytes "gradio<5.33" -U
 pip install git+https://github.com/modelscope/ms-swift.git
-pip install timm -U
-pip install "deepspeed" -U
-pip install qwen_vl_utils qwen_omni_utils decord librosa icecream soundfile -U
-pip install liger_kernel nvitop pre-commit math_verify py-spy -U
+pip install timm deepspeed -U
+pip install qwen_vl_utils qwen_omni_utils keye_vl_utils -U
+pip install decord librosa icecream soundfile -U
+pip install liger_kernel nvitop pre-commit math_verify==0.5.2 py-spy wandb swanlab -U
 # flash-attn: https://github.com/Dao-AILab/flash-attention/releases
diff --git a/tests/test_align/test_template/test_vision.py b/tests/test_align/test_template/test_vision.py
@@ -748,8 +748,9 @@ def test_minicpmv4_5():
     # test_glm4_1v()
     # test_gemma3n()
     # test_keye_vl()
+    test_keye_vl_1_5()
     # test_dots_ocr()
     # test_glm4_5v()
     # test_interns1()
     # test_internvl3_5()
-    test_minicpmv4_5()
+    # test_minicpmv4_5()