From 25b41088d55c692d0109c07a99ef2c7da83e5364 Mon Sep 17 00:00:00 2001 From: Jack-Khuu Date: Thu, 4 Sep 2025 09:27:14 -0700 Subject: [PATCH 1/2] [ez] Fix app/vllm response processing broken by change in policy --- apps/vllm/main.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/apps/vllm/main.py b/apps/vllm/main.py index 9da85e631..bf6aadc95 100644 --- a/apps/vllm/main.py +++ b/apps/vllm/main.py @@ -17,7 +17,7 @@ from forge.actors.policy import Policy, PolicyConfig, SamplingOverrides, WorkerConfig from forge.controller.service import ServiceConfig, shutdown_service, spawn_service -from vllm.outputs import CompletionOutput +from vllm.outputs import RequestOutput async def main(): @@ -89,11 +89,11 @@ async def run_vllm(service_config: ServiceConfig, config: PolicyConfig, prompt: async with policy.session(): print("Requesting generation...") - responses: List[CompletionOutput] = await policy.generate.choose(prompt=prompt) + response_output: RequestOutput = await policy.generate.choose(prompt=prompt) print("\nGeneration Results:") print("=" * 80) - for batch, response in enumerate(responses): + for batch, response in enumerate(response_output.outputs): print(f"Sample {batch + 1}:") print(f"User: {prompt}") print(f"Assistant: {response.text}") From 441d9ae112925a633b4e228ab0870eac99ed6927 Mon Sep 17 00:00:00 2001 From: Jack-Khuu Date: Thu, 4 Sep 2025 09:57:41 -0700 Subject: [PATCH 2/2] Lint --- apps/vllm/main.py | 1 - 1 file changed, 1 deletion(-) diff --git a/apps/vllm/main.py b/apps/vllm/main.py index bf6aadc95..6f98a512e 100644 --- a/apps/vllm/main.py +++ b/apps/vllm/main.py @@ -13,7 +13,6 @@ import argparse import asyncio from argparse import Namespace -from typing import List from forge.actors.policy import Policy, PolicyConfig, SamplingOverrides, WorkerConfig from forge.controller.service import ServiceConfig, shutdown_service, spawn_service