diff --git a/README.md b/README.md index d72aa805eb..923b7e12d2 100644 --- a/README.md +++ b/README.md @@ -124,18 +124,18 @@ Running Environment: | | Range | Recommended | Notes | |--------------|--------------|---------------------|-------------------------------------------| -| python | >=3.9 | 3.10 | | +| python | >=3.9 | 3.10/3.11 | | | cuda | | cuda12 | No need to install if using CPU, NPU, MPS | | torch | >=2.0 | 2.7.1 | | -| transformers | >=4.33 | 4.55.4 | | +| transformers | >=4.33 | 4.56.1 | | | modelscope | >=1.23 | | | | peft | >=0.11,<0.18 | | | | flash_attn | | 2.7.4.post1/3.0.0b1 | | | trl | >=0.15,<0.21 | 0.20.0 | RLHF | -| deepspeed | >=0.14 | 0.16.9 | Training | -| vllm | >=0.5.1 | 0.10 | Inference/Deployment | -| sglang | >=0.4.6 | 0.4.9.post6 | Inference/Deployment | -| lmdeploy | >=0.5 | 0.9.2 | Inference/Deployment | +| deepspeed | >=0.14 | 0.17.5 | Training | +| vllm | >=0.5.1 | 0.10.1.1 | Inference/Deployment | +| sglang | >=0.4.6 | 0.4.10.post2 | Inference/Deployment | +| lmdeploy | >=0.5 | 0.9.2.post1 | Inference/Deployment | | evalscope | >=0.11 | | Evaluation | | gradio | | 5.32.1 | Web-UI/App | diff --git a/README_CN.md b/README_CN.md index 5e677f4ebb..c477ceb0b6 100644 --- a/README_CN.md +++ b/README_CN.md @@ -120,18 +120,18 @@ pip install -e . | | 范围 | 推荐 | 备注 | |--------------|--------------|---------------------|--------------------| -| python | >=3.9 | 3.10 | | +| python | >=3.9 | 3.10/3.11 | | | cuda | | cuda12 | 使用cpu、npu、mps则无需安装 | | torch | >=2.0 | 2.7.1 | | -| transformers | >=4.33 | 4.55.4 | | +| transformers | >=4.33 | 4.56.1 | | | modelscope | >=1.23 | | | | peft | >=0.11,<0.18 | | | | flash_attn | | 2.7.4.post1/3.0.0b1 | | | trl | >=0.15,<0.21 | 0.20.0 | RLHF | -| deepspeed | >=0.14 | 0.16.9 | 训练 | -| vllm | >=0.5.1 | 0.10 | 推理/部署 | -| sglang | >=0.4.6 | 0.4.9.post6 | 推理/部署 | -| lmdeploy | >=0.5 | 0.9.2 | 推理/部署 | +| deepspeed | >=0.14 | 0.17.5 | 训练 | +| vllm | >=0.5.1 | 0.10.1.1 | 推理/部署 | +| sglang | >=0.4.6 | 0.4.10.post2 | 推理/部署 | +| lmdeploy | >=0.5 | 0.9.2.post1 | 推理/部署 | | evalscope | >=0.11 | | 评测 | | gradio | | 5.32.1 | Web-UI/App | diff --git "a/docs/source/GetStarted/SWIFT\345\256\211\350\243\205.md" "b/docs/source/GetStarted/SWIFT\345\256\211\350\243\205.md" index 120f23b639..67e7d9a19a 100644 --- "a/docs/source/GetStarted/SWIFT\345\256\211\350\243\205.md" +++ "b/docs/source/GetStarted/SWIFT\345\256\211\350\243\205.md" @@ -91,18 +91,18 @@ modelscope-registry.us-west-1.cr.aliyuncs.com/modelscope-repo/modelscope:ubuntu2 | | 范围 | 推荐 | 备注 | |--------------|--------------|---------------------|--------------------| -| python | >=3.9 | 3.10 | | +| python | >=3.9 | 3.10/3.11 | | | cuda | | cuda12 | 使用cpu、npu、mps则无需安装 | | torch | >=2.0 | 2.7.1 | | -| transformers | >=4.33 | 4.55.4 | | +| transformers | >=4.33 | 4.56.1 | | | modelscope | >=1.23 | | | | peft | >=0.11,<0.18 | | | | flash_attn | | 2.7.4.post1/3.0.0b1 | | | trl | >=0.15,<0.21 | 0.20.0 | RLHF | -| deepspeed | >=0.14 | 0.16.9 | 训练 | -| vllm | >=0.5.1 | 0.10 | 推理/部署 | -| sglang | >=0.4.6 | 0.4.9.post6 | 推理/部署 | -| lmdeploy | >=0.5 | 0.9.2 | 推理/部署 | +| deepspeed | >=0.14 | 0.17.5 | 训练 | +| vllm | >=0.5.1 | 0.10.1.1 | 推理/部署 | +| sglang | >=0.4.6 | 0.4.10.post2 | 推理/部署 | +| lmdeploy | >=0.5 | 0.9.2.post1 | 推理/部署 | | evalscope | >=0.11 | | 评测 | | gradio | | 5.32.1 | Web-UI/App | diff --git "a/docs/source/Megatron-SWIFT/\345\277\253\351\200\237\345\274\200\345\247\213.md" "b/docs/source/Megatron-SWIFT/\345\277\253\351\200\237\345\274\200\345\247\213.md" index 782d532cab..92b4da5eff 100644 --- "a/docs/source/Megatron-SWIFT/\345\277\253\351\200\237\345\274\200\345\247\213.md" +++ "b/docs/source/Megatron-SWIFT/\345\277\253\351\200\237\345\274\200\345\247\213.md" @@ -45,14 +45,14 @@ modelscope-registry.us-west-1.cr.aliyuncs.com/modelscope-repo/modelscope:ubuntu2 推荐运行环境: | | 范围 | 推荐 | 备注 | |--------------|--------------|-------------|--------------------| -| python | >=3.9 | 3.10 | | +| python | >=3.9 | 3.10/3.11 | | | cuda | | cuda12 | | | torch | >=2.0 | 2.6.0/2.7.1 | | | transformer_engine | >=2.3 | | | | apex | | 0.1 | | | megatron_core | >=0.12 | 0.13 | | | flash_attn | | 2.7.4.post1/3.0.0b1 | | -| transformers | >=4.33 | 4.51.3 | | +| transformers | >=4.33 | 4.56.1 | | | modelscope | >=1.23 | | | | peft | >=0.11,<0.18 | | LoRA | | trl | >=0.15,<0.21 | | RLHF | diff --git a/docs/source_en/GetStarted/SWIFT-installation.md b/docs/source_en/GetStarted/SWIFT-installation.md index d785768259..0a05861e9f 100644 --- a/docs/source_en/GetStarted/SWIFT-installation.md +++ b/docs/source_en/GetStarted/SWIFT-installation.md @@ -92,18 +92,18 @@ More images can be found [here](https://modelscope.cn/docs/intro/environment-set | | Range | Recommended | Notes | |--------------|--------------|---------------------|-------------------------------------------| -| python | >=3.9 | 3.10 | | +| python | >=3.9 | 3.10/3.11 | | | cuda | | cuda12 | No need to install if using CPU, NPU, MPS | | torch | >=2.0 | 2.7.1 | | -| transformers | >=4.33 | 4.55.4 | | +| transformers | >=4.33 | 4.56.1 | | | modelscope | >=1.23 | | | | peft | >=0.11,<0.18 | | | | flash_attn | | 2.7.4.post1/3.0.0b1 | | | trl | >=0.15,<0.21 | 0.20.0 | RLHF | -| deepspeed | >=0.14 | 0.16.9 | Training | -| vllm | >=0.5.1 | 0.10 | Inference/Deployment | -| sglang | >=0.4.6 | 0.4.9.post6 | Inference/Deployment | -| lmdeploy | >=0.5 | 0.9.2 | Inference/Deployment | +| deepspeed | >=0.14 | 0.17.5 | Training | +| vllm | >=0.5.1 | 0.10.1.1 | Inference/Deployment | +| sglang | >=0.4.6 | 0.4.10.post2 | Inference/Deployment | +| lmdeploy | >=0.5 | 0.9.2.post1 | Inference/Deployment | | evalscope | >=0.11 | | Evaluation | | gradio | | 5.32.1 | Web-UI/App | diff --git a/docs/source_en/Megatron-SWIFT/Quick-start.md b/docs/source_en/Megatron-SWIFT/Quick-start.md index 389ae8bea1..e22f17d824 100644 --- a/docs/source_en/Megatron-SWIFT/Quick-start.md +++ b/docs/source_en/Megatron-SWIFT/Quick-start.md @@ -46,14 +46,14 @@ Recommended Operating Environment: | | Range | Recommended | Notes | |--------------|--------------|-------------|--------------------| -| python | >=3.9 | 3.10 | | +| python | >=3.9 | 3.10/3.11 | | | cuda | | cuda12 | | | torch | >=2.0 | 2.6.0/2.7.1 | | | transformer_engine | >=2.3 | | | | apex | | 0.1 | | | megatron_core | >=0.12 | 0.13 | | | flash_attn | | 2.7.4.post1/3.0.0b1 | | -| transformers | >=4.33 | 4.51.3 | | +| transformers | >=4.33 | 4.56.1 | | | modelscope | >=1.23 | | | | peft | >=0.11,<0.18 | | LoRA | | trl | >=0.15,<0.21 | | RLHF | diff --git a/requirements/install_all.sh b/requirements/install_all.sh index f65d8580a6..806dc01e3b 100644 --- a/requirements/install_all.sh +++ b/requirements/install_all.sh @@ -1,13 +1,13 @@ # please use python=3.10, cuda12.* # sh requirements/install_all.sh pip install "sglang[all]<0.5" -U -pip install "vllm>=0.5.1" "transformers<4.56" "trl<0.21" -U +pip install "vllm>=0.5.1,<0.10.2" "transformers<4.57" "trl<0.21" -U pip install "lmdeploy>=0.5" -U pip install autoawq -U --no-deps pip install auto_gptq optimum bitsandbytes "gradio<5.33" -U pip install git+https://github.com/modelscope/ms-swift.git -pip install timm -U -pip install "deepspeed" -U -pip install qwen_vl_utils qwen_omni_utils decord librosa icecream soundfile -U -pip install liger_kernel nvitop pre-commit math_verify py-spy -U +pip install timm deepspeed -U +pip install qwen_vl_utils qwen_omni_utils keye_vl_utils -U +pip install decord librosa icecream soundfile -U +pip install liger_kernel nvitop pre-commit math_verify==0.5.2 py-spy wandb swanlab -U # flash-attn: https://github.com/Dao-AILab/flash-attention/releases diff --git a/tests/test_align/test_template/test_vision.py b/tests/test_align/test_template/test_vision.py index b8379cedbb..0048221727 100644 --- a/tests/test_align/test_template/test_vision.py +++ b/tests/test_align/test_template/test_vision.py @@ -748,8 +748,9 @@ def test_minicpmv4_5(): # test_glm4_1v() # test_gemma3n() # test_keye_vl() + test_keye_vl_1_5() # test_dots_ocr() # test_glm4_5v() # test_interns1() # test_internvl3_5() - test_minicpmv4_5() + # test_minicpmv4_5()