From 76114ca0c16dcd74c590cda7187aa5cb03a014c3 Mon Sep 17 00:00:00 2001 From: Woosuk Kwon Date: Thu, 21 Nov 2024 19:36:47 -0800 Subject: [PATCH 1/2] [Minor] Fix line-too-long Signed-off-by: Woosuk Kwon --- vllm/entrypoints/llm.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/vllm/entrypoints/llm.py b/vllm/entrypoints/llm.py index 2446a64a02eb..8eba0e2c74bc 100644 --- a/vllm/entrypoints/llm.py +++ b/vllm/entrypoints/llm.py @@ -109,16 +109,17 @@ class LLM: hf_overrides: If a dictionary, contains arguments to be forwarded to the HuggingFace config. If a callable, it is called to update the HuggingFace config. - compilation_config: Either an integer or a dictionary. If it is an integer, - it is used as the level of compilation optimization. If it is a dictionary, - it can specify the full compilation configuration. + compilation_config: Either an integer or a dictionary. If it is an + integer, it is used as the level of compilation optimization. + If it is a dictionary, it can specify the full compilation + configuration. **kwargs: Arguments for :class:`~vllm.EngineArgs`. (See :ref:`engine_args`) Note: This class is intended to be used for offline inference. For online serving, use the :class:`~vllm.AsyncLLMEngine` class instead. - """ # noqa + """ DEPRECATE_LEGACY: ClassVar[bool] = False """A flag to toggle whether to deprecate the legacy generate/encode API.""" From 984f0470c3a48ee06d22b73599612b8691cae1db Mon Sep 17 00:00:00 2001 From: Woosuk Kwon Date: Thu, 21 Nov 2024 19:38:16 -0800 Subject: [PATCH 2/2] fix Signed-off-by: Woosuk Kwon --- vllm/entrypoints/llm.py | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/vllm/entrypoints/llm.py b/vllm/entrypoints/llm.py index 8eba0e2c74bc..c211ec5aee08 100644 --- a/vllm/entrypoints/llm.py +++ b/vllm/entrypoints/llm.py @@ -110,9 +110,8 @@ class LLM: HuggingFace config. If a callable, it is called to update the HuggingFace config. compilation_config: Either an integer or a dictionary. If it is an - integer, it is used as the level of compilation optimization. - If it is a dictionary, it can specify the full compilation - configuration. + integer, it is used as the level of compilation optimization. If it + is a dictionary, it can specify the full compilation configuration. **kwargs: Arguments for :class:`~vllm.EngineArgs`. (See :ref:`engine_args`)