Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions deploy/helm/rag/Chart.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,8 +2,8 @@ apiVersion: v2
name: rag
description: A Helm chart for Kubernetes
type: application
version: 0.2.34
appVersion: "0.2.34"
version: 0.2.35
appVersion: "0.2.35"

dependencies:
- name: pgvector
Expand Down
6 changes: 5 additions & 1 deletion deploy/helm/rag/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@ replicaCount: 1
image:
repository: quay.io/rh-ai-quickstart/llamastack-dist-ui
pullPolicy: Always
tag: 0.2.34
tag: 0.2.35

service:
type: ClusterIP
Expand All @@ -16,11 +16,15 @@ livenessProbe:
httpGet:
path: /
port: http
initialDelaySeconds: 60
timeoutSeconds: 15

readinessProbe:
httpGet:
path: /
port: http
initialDelaySeconds: 30
timeoutSeconds: 15

env:
- name: LLAMA_STACK_ENDPOINT
Expand Down
27 changes: 12 additions & 15 deletions frontend/Containerfile
Original file line number Diff line number Diff line change
Expand Up @@ -5,30 +5,27 @@ FROM python:3.12-slim

WORKDIR /app

# Install uv first (rarely changes)
RUN pip install uv
# Install only runtime dependencies at build time.
ENV PIP_NO_CACHE_DIR=1 \
PYTHONDONTWRITEBYTECODE=1 \
PYTHONUNBUFFERED=1

# Copy dependency file first (for better caching)
# Copy dependency metadata first for better layer caching.
COPY pyproject.toml ./

# Install dependencies only (cached unless pyproject.toml changes)
RUN uv pip install --system -r pyproject.toml
# Install dependencies into system site-packages during build.
RUN pip install --no-cache-dir uv && \
uv pip install --system -r pyproject.toml && \
pip uninstall -y uv && \
rm -rf /root/.cache/uv /root/.cache/pip

# Copy application code (invalidates cache only on code changes)
# Copy the rest of the application source.
COPY . /app/

# Set UV cache directory to a writable location
ENV UV_CACHE_DIR=/app/.uv-cache
ENV XDG_CACHE_HOME=/app/.cache

# Create cache directories with proper permissions
RUN mkdir -p /app/.uv-cache /app/.cache && \
chmod -R 777 /app/.uv-cache /app/.cache

# Ensure all app files have proper ownership and permissions for non-root users
RUN chown -R 1001:0 /app && \
chmod -R g+rwX /app

EXPOSE 8501

ENTRYPOINT ["uv", "run", "streamlit", "run", "/app/llama_stack_ui/distribution/ui/app.py", "--server.port=8501", "--server.address=0.0.0.0"]
ENTRYPOINT ["python", "-m", "streamlit", "run", "/app/llama_stack_ui/distribution/ui/app.py", "--server.port=8501", "--server.address=0.0.0.0"]
Loading