From 26a7b1a85921c3884c25c7dc8a7b523777b5967c Mon Sep 17 00:00:00 2001
From: "vol@" <vol@openai.com>
Date: Tue, 5 Aug 2025 14:26:14 -0700
Subject: [PATCH] Update run-vllm.md

---
 articles/gpt-oss/run-vllm.md | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/articles/gpt-oss/run-vllm.md b/articles/gpt-oss/run-vllm.md
index fc70d119f0..b590795c49 100644
--- a/articles/gpt-oss/run-vllm.md
+++ b/articles/gpt-oss/run-vllm.md
@@ -26,7 +26,10 @@ Both models are **MXFP4 quantized** out of the box.
 ```shell
 uv venv --python 3.12 --seed
 source .venv/bin/activate
-uv pip install vllm --torch-backend=auto
+uv pip install --pre vllm==0.10.1+gptoss \
+    --extra-index-url https://wheels.vllm.ai/gpt-oss/ \
+    --extra-index-url https://download.pytorch.org/whl/nightly/cu128 \
+    --index-strategy unsafe-best-match
 ```
 
 2. **Start up a server and download the model**