From d0840d6db6ff7259b1947748a557e4db7c22bb38 Mon Sep 17 00:00:00 2001 From: Pavel Tisnovsky Date: Tue, 26 Aug 2025 14:03:51 +0200 Subject: [PATCH 1/3] LCORE-599: bump-up Llama Stack version to 0.2.18 --- pyproject.toml | 4 ++-- src/constants.py | 2 +- uv.lock | 16 ++++++++-------- 3 files changed, 11 insertions(+), 11 deletions(-) diff --git a/pyproject.toml b/pyproject.toml index 82fb2d9c..76777c01 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -25,8 +25,8 @@ dependencies = [ "fastapi>=0.115.12", "uvicorn>=0.34.3", "kubernetes>=30.1.0", - "llama-stack==0.2.17", - "llama-stack-client==0.2.17", + "llama-stack==0.2.18", + "llama-stack-client==0.2.18", "rich>=14.0.0", "cachetools>=6.1.0", "prometheus-client>=0.22.1", diff --git a/src/constants.py b/src/constants.py index 4a2a4b86..2260d510 100644 --- a/src/constants.py +++ b/src/constants.py @@ -2,7 +2,7 @@ # Minimal and maximal supported Llama Stack version MINIMAL_SUPPORTED_LLAMA_STACK_VERSION = "0.2.17" -MAXIMAL_SUPPORTED_LLAMA_STACK_VERSION = "0.2.17" +MAXIMAL_SUPPORTED_LLAMA_STACK_VERSION = "0.2.18" UNABLE_TO_PROCESS_RESPONSE = "Unable to process this request" diff --git a/uv.lock b/uv.lock index 15a3ddfd..bf2d91ef 100644 --- a/uv.lock +++ b/uv.lock @@ -1342,8 +1342,8 @@ requires-dist = [ { name = "fastapi", specifier = ">=0.115.12" }, { name = "jsonpath-ng", specifier = ">=1.6.1" }, { name = "kubernetes", specifier = ">=30.1.0" }, - { name = "llama-stack", specifier = "==0.2.17" }, - { name = "llama-stack-client", specifier = "==0.2.17" }, + { name = "llama-stack", specifier = "==0.2.18" }, + { name = "llama-stack-client", specifier = "==0.2.18" }, { name = "openai", specifier = "==1.99.9" }, { name = "prometheus-client", specifier = ">=0.22.1" }, { name = "rich", specifier = ">=14.0.0" }, @@ -1452,7 +1452,7 @@ wheels = [ [[package]] name = "llama-stack" -version = "0.2.17" +version = "0.2.18" source = { registry = "https://pypi.org/simple" } dependencies = [ { name = "aiohttp" }, @@ -1482,14 +1482,14 @@ 
dependencies = [ { name = "tiktoken" }, { name = "uvicorn" }, ] -sdist = { url = "https://files.pythonhosted.org/packages/3b/43/ab4969bd47c9981efa713fa21c8c2ac534425831b265157248bfc710a508/llama_stack-0.2.17.tar.gz", hash = "sha256:f5e50f85a7483022bb86f9971bbe6f98274175e2e5584fb0a7df2d9ac43f5d57", size = 3301909, upload-time = "2025-08-05T01:43:04.059Z" } +sdist = { url = "https://files.pythonhosted.org/packages/ed/e1/16c52856746e1412274c085a6e6a21829133f9db3d4932a009700594f4a2/llama_stack-0.2.18.tar.gz", hash = "sha256:0ea6e150140047568e45f98100027a79e20340711e5feff083d9b9dfe42d2605", size = 3321726, upload-time = "2025-08-19T22:12:17.257Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/53/87/ebb127c7594cfecfa5b42db99a919a942e429a1571fd6c872890dfc9a6d9/llama_stack-0.2.17-py3-none-any.whl", hash = "sha256:b067575c26938932bf1a54246009b08b0082d5d5b511c5f14bd81a80167e046c", size = 3624746, upload-time = "2025-08-05T01:43:02.395Z" }, + { url = "https://files.pythonhosted.org/packages/65/72/c68c50be2d2808fe162c3f344f976bc29839f0cee7a6d951cc3805f8482d/llama_stack-0.2.18-py3-none-any.whl", hash = "sha256:3383fb4da1cc6e77a58ae425ef49ce470bca784ca85051dd6b2b70966f936bea", size = 3650850, upload-time = "2025-08-19T22:12:15.857Z" }, ] [[package]] name = "llama-stack-client" -version = "0.2.17" +version = "0.2.18" source = { registry = "https://pypi.org/simple" } dependencies = [ { name = "anyio" }, @@ -1508,9 +1508,9 @@ dependencies = [ { name = "tqdm" }, { name = "typing-extensions" }, ] -sdist = { url = "https://files.pythonhosted.org/packages/c5/2a/bb2949d6a5c494d21da0c185d426e25eaa8016f8287b689249afc6c96fb5/llama_stack_client-0.2.17.tar.gz", hash = "sha256:1fe2070133c6356761e394fa346045e9b6b567d4c63157b9bc6be89b9a6e7a41", size = 257636, upload-time = "2025-08-05T01:42:55.911Z" } +sdist = { url = "https://files.pythonhosted.org/packages/69/da/5e5a745495f8a2b8ef24fc4d01fe9031aa2277c36447cb22192ec8c8cc1e/llama_stack_client-0.2.18.tar.gz", hash = 
"sha256:860c885c9e549445178ac55cc9422e6e2a91215ac7aff5aaccfb42f3ce07e79e", size = 277284, upload-time = "2025-08-19T22:12:09.106Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/81/fc/5eccc86b83c5ced3a3bca071d250a86ccafa4ff17546cf781deb7758ab74/llama_stack_client-0.2.17-py3-none-any.whl", hash = "sha256:336c32f8688700ff64717b8109f405dc87a990fbe310c2027ac9ed6d39d67d16", size = 350329, upload-time = "2025-08-05T01:42:54.381Z" }, + { url = "https://files.pythonhosted.org/packages/0a/e4/e97f8fdd8a07aa1efc7f7e37b5657d84357b664bf70dd1885a437edc0699/llama_stack_client-0.2.18-py3-none-any.whl", hash = "sha256:90f827d5476f7fc15fd993f1863af6a6e72bd064646bf6a99435eb43a1327f70", size = 367586, upload-time = "2025-08-19T22:12:07.899Z" }, ] [[package]] From 3e44dde47e6f4a2aa7a4f050228b657b13a63f1c Mon Sep 17 00:00:00 2001 From: Pavel Tisnovsky Date: Tue, 26 Aug 2025 14:56:50 +0200 Subject: [PATCH 2/3] Fixed configuration settings --- .github/workflows/e2e_tests.yaml | 3 ++- run.yaml | 1 + 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/e2e_tests.yaml b/.github/workflows/e2e_tests.yaml index f31fbc7f..757ae153 100644 --- a/.github/workflows/e2e_tests.yaml +++ b/.github/workflows/e2e_tests.yaml @@ -169,6 +169,7 @@ jobs: checkpoint_format: huggingface device: cpu distributed_backend: null + dpo_output_dir: "." provider_id: huggingface provider_type: inline::huggingface safety: @@ -262,4 +263,4 @@ jobs: uv sync echo "Running comprehensive e2e test suite..." - make test-e2e \ No newline at end of file + make test-e2e diff --git a/run.yaml b/run.yaml index 1196d854..e04bd72e 100644 --- a/run.yaml +++ b/run.yaml @@ -69,6 +69,7 @@ providers: checkpoint_format: huggingface device: cpu distributed_backend: null + dpo_output_dir: "." 
provider_id: huggingface provider_type: inline::huggingface safety: From bbc3f1c9346f29e1695046da9c5276a68a54c40a Mon Sep 17 00:00:00 2001 From: Pavel Tisnovsky Date: Tue, 26 Aug 2025 15:46:11 +0200 Subject: [PATCH 3/3] Use single quotes for dpo_output_dir in e2e tests workflow --- .github/workflows/e2e_tests.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/e2e_tests.yaml b/.github/workflows/e2e_tests.yaml index 757ae153..5a339598 100644 --- a/.github/workflows/e2e_tests.yaml +++ b/.github/workflows/e2e_tests.yaml @@ -169,7 +169,7 @@ jobs: checkpoint_format: huggingface device: cpu distributed_backend: null - dpo_output_dir: "." + dpo_output_dir: '.' provider_id: huggingface provider_type: inline::huggingface safety: