From 87be73e6296622d6a02f0cded6fc42f536e5202d Mon Sep 17 00:00:00 2001 From: Randall Smith Date: Sat, 22 Nov 2025 00:48:39 -0600 Subject: [PATCH 1/3] Don't add FLASHINFER backend in test_cpu_offloading.py Signed-off-by: Randall Smith --- tests/v1/sample/test_sampling_params_e2e.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/v1/sample/test_sampling_params_e2e.py b/tests/v1/sample/test_sampling_params_e2e.py index 1684252174d3..e7d689d01ec5 100644 --- a/tests/v1/sample/test_sampling_params_e2e.py +++ b/tests/v1/sample/test_sampling_params_e2e.py @@ -119,6 +119,7 @@ def test_bad_words(llm): params = SamplingParams(temperature=0, bad_words=[bad_words_1, bad_words_2]) output = llm.generate(PROMPT, params) new_text = output[0].outputs[0].text + print(f"new_text={new_text}") assert bad_words_1 not in new_text assert bad_words_2 not in new_text From d411c9c9be02db230ef0499679c735456b659c05 Mon Sep 17 00:00:00 2001 From: Randall Smith Date: Sat, 22 Nov 2025 00:50:34 -0600 Subject: [PATCH 2/3] add the right file Signed-off-by: Randall Smith --- tests/v1/kv_offload/test_cpu_offloading.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/tests/v1/kv_offload/test_cpu_offloading.py b/tests/v1/kv_offload/test_cpu_offloading.py index 3ee41c40859d..406d4c0b4c1f 100644 --- a/tests/v1/kv_offload/test_cpu_offloading.py +++ b/tests/v1/kv_offload/test_cpu_offloading.py @@ -12,10 +12,14 @@ from vllm import LLM, SamplingParams, TokensPrompt from vllm.config import KVEventsConfig, KVTransferConfig from vllm.distributed.kv_events import BlockStored, KVEventBatch +from vllm.platforms import current_platform from vllm.utils.system_utils import set_env_var CPU_BLOCK_SIZES = [48] -ATTN_BACKENDS = ["FLASH_ATTN", "FLASHINFER"] +ATTN_BACKENDS = ["FLASH_ATTN"] + +if current_platform.is_cuda(): + ATTN_BACKENDS.append("FLASHINFER") class MockSubscriber: From 3dd9f39ec496059315657f89053b7524f1ede1c8 Mon Sep 17 00:00:00 2001 From: Randall Smith Date: Sat, 22 Nov 2025 
00:53:46 -0600 Subject: [PATCH 3/3] Remove debug print accidentally added to test_sampling_params_e2e.py Signed-off-by: Randall Smith --- tests/v1/sample/test_sampling_params_e2e.py | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/v1/sample/test_sampling_params_e2e.py b/tests/v1/sample/test_sampling_params_e2e.py index e7d689d01ec5..1684252174d3 100644 --- a/tests/v1/sample/test_sampling_params_e2e.py +++ b/tests/v1/sample/test_sampling_params_e2e.py @@ -119,7 +119,6 @@ def test_bad_words(llm): params = SamplingParams(temperature=0, bad_words=[bad_words_1, bad_words_2]) output = llm.generate(PROMPT, params) new_text = output[0].outputs[0].text - print(f"new_text={new_text}") assert bad_words_1 not in new_text assert bad_words_2 not in new_text