From 49eecdaa06a5cb6ec16a596bee69d0cd304eb288 Mon Sep 17 00:00:00 2001
From: Ryan Johnson <johnson2500@live.com>
Date: Thu, 12 Mar 2026 17:00:06 -0400
Subject: [PATCH 1/2] chore(llama-stack): bump llama-stack and
 llama-stack-client to 0.6.0

---
 deploy/helm/rag/Chart.yaml                      |  4 ++--
 deploy/local/Makefile                           |  2 +-
 .../distribution/ui/page/playground/agent.py    |  3 +--
 frontend/pyproject.toml                         |  4 ++--
 frontend/uv.lock                                | 17 ++++++++---------
 5 files changed, 14 insertions(+), 16 deletions(-)

diff --git a/deploy/helm/rag/Chart.yaml b/deploy/helm/rag/Chart.yaml
index 5239436..296d15c 100644
--- a/deploy/helm/rag/Chart.yaml
+++ b/deploy/helm/rag/Chart.yaml
@@ -19,11 +19,11 @@ dependencies:
     repository: https://rh-ai-quickstart.github.io/ai-architecture-charts
     condition: configure-pipeline.enabled
   - name: ingestion-pipeline
-    version: 0.7.0
+    version: 0.7.3
     repository: https://rh-ai-quickstart.github.io/ai-architecture-charts
     condition: ingestion-pipeline.enabled
   - name: llama-stack
-    version: 0.7.1
+    version: 0.7.3
     repository: https://rh-ai-quickstart.github.io/ai-architecture-charts
     condition: llama-stack.enabled
   - name: mcp-servers
diff --git a/deploy/local/Makefile b/deploy/local/Makefile
index 8f74434..87960e3 100644
--- a/deploy/local/Makefile
+++ b/deploy/local/Makefile
@@ -19,7 +19,7 @@ PROJECT_NAME := rag
 OLLAMA_MODEL := llama3.2:3b-instruct-fp16
 
 # UI Build Configuration
-VERSION ?= 0.5.1
+VERSION ?= 0.6.0
 TAVILY_SEARCH_API_KEY ?= ""
 CONTAINER_REGISTRY ?= quay.io/rh-ai-quickstart
 DIST_UI_DIR := $(abspath ../../frontend)
diff --git a/frontend/llama_stack_ui/distribution/ui/page/playground/agent.py b/frontend/llama_stack_ui/distribution/ui/page/playground/agent.py
index 050a6db..31a6241 100644
--- a/frontend/llama_stack_ui/distribution/ui/page/playground/agent.py
+++ b/frontend/llama_stack_ui/distribution/ui/page/playground/agent.py
@@ -363,8 +363,7 @@ def agent_process_prompt(prompt, state, config):
         "temperature": config.sampling.temperature,
         "max_infer_iters": config.sampling.max_infer_iters,
         "stream": True,
-       # "max_output_tokens": config.sampling.max_tokens,
-
+        "max_output_tokens": config.sampling.max_tokens,
     }
 
     # Add tools if available
diff --git a/frontend/pyproject.toml b/frontend/pyproject.toml
index 78f27dd..ee49023 100644
--- a/frontend/pyproject.toml
+++ b/frontend/pyproject.toml
@@ -10,10 +10,10 @@ requires-python = ">=3.12"
 dependencies = [
     "streamlit",
     "pandas",
-	"llama-stack-client==0.5.1",
+	"llama-stack-client==0.6.0",
     "requests",
     "streamlit-option-menu",
-    "llama-stack==0.5.1",
+    "llama-stack==0.6.0",
     "fire",
     "asyncpg",
 ]
diff --git a/frontend/uv.lock b/frontend/uv.lock
index 773f591..87f0abf 100644
--- a/frontend/uv.lock
+++ b/frontend/uv.lock
@@ -809,7 +809,7 @@ wheels = [
 
 [[package]]
 name = "llama-stack"
-version = "0.5.2"
+version = "0.6.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "aiohttp" },
@@ -830,7 +830,6 @@ dependencies = [
     { name = "opentelemetry-exporter-otlp-proto-http" },
     { name = "opentelemetry-sdk" },
     { name = "oracledb" },
-    { name = "pillow" },
     { name = "prompt-toolkit" },
     { name = "psycopg2-binary" },
     { name = "pydantic" },
@@ -847,9 +846,9 @@ dependencies = [
     { name = "urllib3" },
     { name = "uvicorn" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/ce/a8/3724d0c06a06578a639345f5086b93ba234a0ac247ec4ed7854d0d5e5ca6/llama_stack-0.5.2.tar.gz", hash = "sha256:9334c781e4ded6520aa60c3301a9087e9fb8fdaea8e5f30f8e21d85b17231d8d", size = 16035748, upload-time = "2026-03-06T13:25:59.356Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/f4/53/5bc3ae19e9a42475b42682456898ced5a0b48e43f918920fc790b665f223/llama_stack-0.6.0.tar.gz", hash = "sha256:d92711791633f5505a4473ffba3f3e26acb700716fddab5aec419d99e614c802", size = 13631563, upload-time = "2026-03-11T15:06:13.071Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/62/4c/fea3f2ffeead47a934704f1527685106766c5ea69dd99c0a83e872b22aa7/llama_stack-0.5.2-py3-none-any.whl", hash = "sha256:581fda638088ee029aab20afe3c42ba8f7f6ef21c80bd9ebcae20bb13c3409d3", size = 3979442, upload-time = "2026-03-06T13:25:56.581Z" },
+    { url = "https://files.pythonhosted.org/packages/9d/17/b4427e1db7409f698c95b6f8b2b9e662bbcf1f819beb1af180bab55ddfb5/llama_stack-0.6.0-py3-none-any.whl", hash = "sha256:b804830664dc91e54c7225a7a081cb1874c48fc18573569c19fac4a9397e8076", size = 770027, upload-time = "2026-03-11T15:06:10.649Z" },
 ]
 
 [[package]]
@@ -871,7 +870,7 @@ wheels = [
 
 [[package]]
 name = "llama-stack-client"
-version = "0.5.2"
+version = "0.6.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "anyio" },
@@ -890,9 +889,9 @@ dependencies = [
     { name = "tqdm" },
     { name = "typing-extensions" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/99/8a/8742475db7cedc2d452a3a7677da7f24aa84bdd262bc97543029c62df772/llama_stack_client-0.5.2.tar.gz", hash = "sha256:17c1bbad90f7699da4eb3cae256e8823caa4d2be945512a45c8c6f89ab899f28", size = 368612, upload-time = "2026-03-06T13:24:22.252Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/b7/e9/62dc71e7d6003d9b56a1e632445065f55687c891e62eff1636e10b5dd629/llama_stack_client-0.6.0.tar.gz", hash = "sha256:3290aac36dcafbd1bc0baaf995522e2037f57056672b5a1516af112a4210f3ea", size = 368695, upload-time = "2026-03-11T15:04:19.267Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/4d/f9/f6224b8819748358a573e3a2b8e299c0b6ba5f9cedf2942188c361c8e555/llama_stack_client-0.5.2-py3-none-any.whl", hash = "sha256:473f4d67ac0b243b0fc29555a0203a742615d31bea606b4332d9e2f193f73d6a", size = 391951, upload-time = "2026-03-06T13:24:20.559Z" },
+    { url = "https://files.pythonhosted.org/packages/83/a3/33d3e066a320a993b6f9cca9c8efe8da7deb2045df61235d327d0a05b25f/llama_stack_client-0.6.0-py3-none-any.whl", hash = "sha256:7e514a6ffd92f237aceb062dadc4db44e24a3cd9c4ea35e25173d1e0739beb8e", size = 392001, upload-time = "2026-03-11T15:04:17.772Z" },
 ]
 
 [[package]]
@@ -914,8 +913,8 @@ dependencies = [
 requires-dist = [
     { name = "asyncpg" },
     { name = "fire" },
-    { name = "llama-stack", specifier = "==0.5.2" },
-    { name = "llama-stack-client", specifier = "==0.5.2" },
+    { name = "llama-stack", specifier = "==0.6.0" },
+    { name = "llama-stack-client", specifier = "==0.6.0" },
     { name = "pandas" },
     { name = "requests" },
     { name = "streamlit" },

From 667938d523030596799882a50f002a74db406cd8 Mon Sep 17 00:00:00 2001
From: sauagarwa <sauagarw@redhat.com>
Date: Mon, 16 Mar 2026 16:50:41 -0400
Subject: [PATCH 2/2] fix: sync helm lockfile and track it in git

Update the rag chart's dependency lock to match Chart.yaml, and stop
ignoring Chart.lock so that ArgoCD manifest generation remains
deterministic. Also ignore tenant/bootstrap-values.yaml.

Made-with: Cursor
---
 .gitignore                 | 2 +-
 deploy/helm/rag/Chart.lock | 8 ++++----
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/.gitignore b/.gitignore
index 42d3bf2..bb9509c 100644
--- a/.gitignore
+++ b/.gitignore
@@ -183,7 +183,7 @@ deploy/helm/secrets
 # RAG Stack Configuration
 # User-specific configuration file (contains sensitive data)
 deploy/helm/rag-values.yaml
-deploy/helm/rag/Chart.lock
 deploy/helm/values.yaml
 deploy/helm/bootstrap-values.yaml
 tenant/bootstrap/bootstrap-values.yaml
+tenant/bootstrap-values.yaml
\ No newline at end of file
diff --git a/deploy/helm/rag/Chart.lock b/deploy/helm/rag/Chart.lock
index 8dea968..6d4be79 100644
--- a/deploy/helm/rag/Chart.lock
+++ b/deploy/helm/rag/Chart.lock
@@ -10,12 +10,12 @@ dependencies:
   version: 0.5.6
 - name: ingestion-pipeline
   repository: https://rh-ai-quickstart.github.io/ai-architecture-charts
-  version: 0.7.0
+  version: 0.7.3
 - name: llama-stack
   repository: https://rh-ai-quickstart.github.io/ai-architecture-charts
-  version: 0.7.1
+  version: 0.7.3
 - name: mcp-servers
   repository: https://rh-ai-quickstart.github.io/ai-architecture-charts
   version: 0.5.15
-digest: sha256:0dbca435d7b3b408321cb33489ad8f099b4ae64501cde761cb47ea9c8e0abc20
-generated: "2026-03-06T14:32:40.986363-05:00"
+digest: sha256:ac4d12af3cc62bd462293d89f20fbe01a7c67fd7ce50ab78a1fe0ff27dfebb55
+generated: "2026-03-16T16:48:25.929533-04:00"