From 49eecdaa06a5cb6ec16a596bee69d0cd304eb288 Mon Sep 17 00:00:00 2001 From: Ryan Johnson Date: Thu, 12 Mar 2026 17:00:06 -0400 Subject: [PATCH 1/2] chore(llama-stack): bump version of llamastack client and eventually version --- deploy/helm/rag/Chart.yaml | 4 ++-- deploy/local/Makefile | 2 +- .../distribution/ui/page/playground/agent.py | 3 +-- frontend/pyproject.toml | 4 ++-- frontend/uv.lock | 17 ++++++++--------- 5 files changed, 14 insertions(+), 16 deletions(-) diff --git a/deploy/helm/rag/Chart.yaml b/deploy/helm/rag/Chart.yaml index 5239436..296d15c 100644 --- a/deploy/helm/rag/Chart.yaml +++ b/deploy/helm/rag/Chart.yaml @@ -19,11 +19,11 @@ dependencies: repository: https://rh-ai-quickstart.github.io/ai-architecture-charts condition: configure-pipeline.enabled - name: ingestion-pipeline - version: 0.7.0 + version: 0.7.3 repository: https://rh-ai-quickstart.github.io/ai-architecture-charts condition: ingestion-pipeline.enabled - name: llama-stack - version: 0.7.1 + version: 0.7.3 repository: https://rh-ai-quickstart.github.io/ai-architecture-charts condition: llama-stack.enabled - name: mcp-servers diff --git a/deploy/local/Makefile b/deploy/local/Makefile index 8f74434..87960e3 100644 --- a/deploy/local/Makefile +++ b/deploy/local/Makefile @@ -19,7 +19,7 @@ PROJECT_NAME := rag OLLAMA_MODEL := llama3.2:3b-instruct-fp16 # UI Build Configuration -VERSION ?= 0.5.1 +VERSION ?= 0.6.0 TAVILY_SEARCH_API_KEY ?= "" CONTAINER_REGISTRY ?= quay.io/rh-ai-quickstart DIST_UI_DIR := $(abspath ../../frontend) diff --git a/frontend/llama_stack_ui/distribution/ui/page/playground/agent.py b/frontend/llama_stack_ui/distribution/ui/page/playground/agent.py index 050a6db..31a6241 100644 --- a/frontend/llama_stack_ui/distribution/ui/page/playground/agent.py +++ b/frontend/llama_stack_ui/distribution/ui/page/playground/agent.py @@ -363,8 +363,7 @@ def agent_process_prompt(prompt, state, config): "temperature": config.sampling.temperature, "max_infer_iters": config.sampling.max_infer_iters, "stream": True, - # "max_output_tokens": config.sampling.max_tokens, - + "max_output_tokens": config.sampling.max_tokens, } # Add tools if available diff --git a/frontend/pyproject.toml b/frontend/pyproject.toml index 78f27dd..ee49023 100644 --- a/frontend/pyproject.toml +++ b/frontend/pyproject.toml @@ -10,10 +10,10 @@ requires-python = ">=3.12" dependencies = [ "streamlit", "pandas", - "llama-stack-client==0.5.1", + "llama-stack-client==0.6.0", "requests", "streamlit-option-menu", - "llama-stack==0.5.1", + "llama-stack==0.6.0", "fire", "asyncpg", ] diff --git a/frontend/uv.lock b/frontend/uv.lock index 773f591..87f0abf 100644 --- a/frontend/uv.lock +++ b/frontend/uv.lock @@ -809,7 +809,7 @@ wheels = [ [[package]] name = "llama-stack" -version = "0.5.2" +version = "0.6.0" source = { registry = "https://pypi.org/simple" } dependencies = [ { name = "aiohttp" }, @@ -830,7 +830,6 @@ dependencies = [ { name = "opentelemetry-exporter-otlp-proto-http" }, { name = "opentelemetry-sdk" }, { name = "oracledb" }, - { name = "pillow" }, { name = "prompt-toolkit" }, { name = "psycopg2-binary" }, { name = "pydantic" }, @@ -847,9 +846,9 @@ dependencies = [ { name = "urllib3" }, { name = "uvicorn" }, ] -sdist = { url = "https://files.pythonhosted.org/packages/ce/a8/3724d0c06a06578a639345f5086b93ba234a0ac247ec4ed7854d0d5e5ca6/llama_stack-0.5.2.tar.gz", hash = "sha256:9334c781e4ded6520aa60c3301a9087e9fb8fdaea8e5f30f8e21d85b17231d8d", size = 16035748, upload-time = "2026-03-06T13:25:59.356Z" } +sdist = { url = "https://files.pythonhosted.org/packages/f4/53/5bc3ae19e9a42475b42682456898ced5a0b48e43f918920fc790b665f223/llama_stack-0.6.0.tar.gz", hash = "sha256:d92711791633f5505a4473ffba3f3e26acb700716fddab5aec419d99e614c802", size = 13631563, upload-time = "2026-03-11T15:06:13.071Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/62/4c/fea3f2ffeead47a934704f1527685106766c5ea69dd99c0a83e872b22aa7/llama_stack-0.5.2-py3-none-any.whl", hash = "sha256:581fda638088ee029aab20afe3c42ba8f7f6ef21c80bd9ebcae20bb13c3409d3", size = 3979442, upload-time = "2026-03-06T13:25:56.581Z" }, + { url = "https://files.pythonhosted.org/packages/9d/17/b4427e1db7409f698c95b6f8b2b9e662bbcf1f819beb1af180bab55ddfb5/llama_stack-0.6.0-py3-none-any.whl", hash = "sha256:b804830664dc91e54c7225a7a081cb1874c48fc18573569c19fac4a9397e8076", size = 770027, upload-time = "2026-03-11T15:06:10.649Z" }, ] [[package]] @@ -871,7 +870,7 @@ wheels = [ [[package]] name = "llama-stack-client" -version = "0.5.2" +version = "0.6.0" source = { registry = "https://pypi.org/simple" } dependencies = [ { name = "anyio" }, @@ -890,9 +889,9 @@ dependencies = [ { name = "tqdm" }, { name = "typing-extensions" }, ] -sdist = { url = "https://files.pythonhosted.org/packages/99/8a/8742475db7cedc2d452a3a7677da7f24aa84bdd262bc97543029c62df772/llama_stack_client-0.5.2.tar.gz", hash = "sha256:17c1bbad90f7699da4eb3cae256e8823caa4d2be945512a45c8c6f89ab899f28", size = 368612, upload-time = "2026-03-06T13:24:22.252Z" } +sdist = { url = "https://files.pythonhosted.org/packages/b7/e9/62dc71e7d6003d9b56a1e632445065f55687c891e62eff1636e10b5dd629/llama_stack_client-0.6.0.tar.gz", hash = "sha256:3290aac36dcafbd1bc0baaf995522e2037f57056672b5a1516af112a4210f3ea", size = 368695, upload-time = "2026-03-11T15:04:19.267Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/4d/f9/f6224b8819748358a573e3a2b8e299c0b6ba5f9cedf2942188c361c8e555/llama_stack_client-0.5.2-py3-none-any.whl", hash = "sha256:473f4d67ac0b243b0fc29555a0203a742615d31bea606b4332d9e2f193f73d6a", size = 391951, upload-time = "2026-03-06T13:24:20.559Z" }, + { url = "https://files.pythonhosted.org/packages/83/a3/33d3e066a320a993b6f9cca9c8efe8da7deb2045df61235d327d0a05b25f/llama_stack_client-0.6.0-py3-none-any.whl", hash = "sha256:7e514a6ffd92f237aceb062dadc4db44e24a3cd9c4ea35e25173d1e0739beb8e", size = 392001, upload-time = "2026-03-11T15:04:17.772Z" }, ] [[package]] @@ -914,8 +913,8 @@ dependencies = [ requires-dist = [ { name = "asyncpg" }, { name = "fire" }, - { name = "llama-stack", specifier = "==0.5.2" }, - { name = "llama-stack-client", specifier = "==0.5.2" }, + { name = "llama-stack", specifier = "==0.6.0" }, + { name = "llama-stack-client", specifier = "==0.6.0" }, { name = "pandas" }, { name = "requests" }, { name = "streamlit" }, From 667938d523030596799882a50f002a74db406cd8 Mon Sep 17 00:00:00 2001 From: sauagarwa Date: Mon, 16 Mar 2026 16:50:41 -0400 Subject: [PATCH 2/2] fix: sync helm lockfile and track it in git Update rag chart dependencies lock to match Chart.yaml and stop ignoring Chart.lock so ArgoCD manifest generation remains deterministic. Made-with: Cursor --- .gitignore | 2 +- deploy/helm/rag/Chart.lock | 8 ++++---- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/.gitignore b/.gitignore index 42d3bf2..bb9509c 100644 --- a/.gitignore +++ b/.gitignore @@ -183,7 +183,7 @@ deploy/helm/secrets # RAG Stack Configuration # User-specific configuration file (contains sensitive data) deploy/helm/rag-values.yaml -deploy/helm/rag/Chart.lock deploy/helm/values.yaml deploy/helm/bootstrap-values.yaml tenant/bootstrap/bootstrap-values.yaml +tenant/bootstrap-values.yaml \ No newline at end of file diff --git a/deploy/helm/rag/Chart.lock b/deploy/helm/rag/Chart.lock index 8dea968..6d4be79 100644 --- a/deploy/helm/rag/Chart.lock +++ b/deploy/helm/rag/Chart.lock @@ -10,12 +10,12 @@ dependencies: version: 0.5.6 - name: ingestion-pipeline repository: https://rh-ai-quickstart.github.io/ai-architecture-charts - version: 0.7.0 + version: 0.7.3 - name: llama-stack repository: https://rh-ai-quickstart.github.io/ai-architecture-charts - version: 0.7.1 + version: 0.7.3 - name: mcp-servers repository: https://rh-ai-quickstart.github.io/ai-architecture-charts version: 0.5.15 -digest: sha256:0dbca435d7b3b408321cb33489ad8f099b4ae64501cde761cb47ea9c8e0abc20 -generated: "2026-03-06T14:32:40.986363-05:00" +digest: sha256:ac4d12af3cc62bd462293d89f20fbe01a7c67fd7ce50ab78a1fe0ff27dfebb55 +generated: "2026-03-16T16:48:25.929533-04:00"