modelscope · Jintao-Huang · Oct 21, 2025 · Oct 21, 2025 · Oct 21, 2025 · Oct 21, 2025
diff --git a/docs/source/BestPractices/Qwen3-VL最佳实践.md b/docs/source/BestPractices/Qwen3-VL最佳实践.md
@@ -73,7 +73,7 @@ print(output_text[0])
 使用 ms-swift 的 `PtEngine` 进行推理：
 ```python
 import os
-os.environ['SWIFT_DEBUG'] = '1'
+# os.environ['SWIFT_DEBUG'] = '1'
 os.environ['CUDA_VISIBLE_DEVICES'] = '0'
 os.environ['VIDEO_MAX_TOKEN_NUM'] = '128'
 os.environ['FPS_MAX_FRAMES'] = '16'

diff --git a/examples/models/deepseek_ocr/infer.py b/examples/models/deepseek_ocr/infer.py
@@ -0,0 +1,29 @@
+# pip install "transformers==4.46.3" easydict
+import os
+
+os.environ['CUDA_VISIBLE_DEVICES'] = '0'
+# os.environ['SWIFT_DEBUG'] = '1'
+
+if __name__ == '__main__':
+    from swift.llm import InferRequest, PtEngine, RequestConfig
+    engine = PtEngine('deepseek-ai/DeepSeek-OCR')
+    infer_request = InferRequest(
+        messages=[{
+            'role': 'user',
+            # or
+            'content': '<image>Free OCR.',
+            # "content": '<image><|grounding|>Convert the document to markdown.',
+        }],
+        images=['https://modelscope-open.oss-cn-hangzhou.aliyuncs.com/images/ocr.png'])
+    request_config = RequestConfig(max_tokens=512, temperature=0)
+    resp_list = engine.infer([infer_request], request_config=request_config)
+    response = resp_list[0].choices[0].message.content
+
+    # use stream
+    request_config = RequestConfig(max_tokens=512, temperature=0, stream=True)
+    gen_list = engine.infer([infer_request], request_config=request_config)
+    for chunk in gen_list[0]:
+        if chunk is None:
+            continue
+        print(chunk.choices[0].delta.content, end='', flush=True)
+    print()
diff --git a/examples/models/deepseek_vl2/deepseek_ocr.sh → examples/models/deepseek_ocr/train.sh b/examples/models/deepseek_vl2/deepseek_ocr.sh → examples/models/deepseek_ocr/train.sh
@@ -1,5 +1,5 @@
 # 24GiB
-pip install "transformers==4.46.3"
+pip install "transformers==4.46.3" easydict
 
 CUDA_VISIBLE_DEVICES=0 \
 swift sft \