From d5c3ef8e6d21b4c90a64dc0f3eaccc04b28960c1 Mon Sep 17 00:00:00 2001 From: varashi Date: Wed, 27 May 2026 09:02:32 +0200 Subject: [PATCH] fix(logging): drop longhorn storageClassName on fluentd PVC, use cluster default MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit The Logging CR referenced `storageClassName: longhorn`, but Longhorn was removed from k8s-talos earlier; only `vsan` (vSphere CSI, also cluster default) is available. As a result, fluentd-0 was stuck Pending with an unbound PVC. Removing the explicit storageClassName lets the PVC bind against the default StorageClass — vsan handles ReadWriteOnce + WaitForFirstConsumer for the 5Gi fluentd buffer fine. Note on StatefulSet volumeClaimTemplates immutability: the existing STS may fail to reconcile this change directly; if so, delete the STS (the operator recreates it) and delete the Pending PVCs. Co-Authored-By: Claude Opus 4.7 --- .../platform/logging/logging-config/app/logging.yaml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/cluster-talos/kubernetes/infrastructure/platform/logging/logging-config/app/logging.yaml b/cluster-talos/kubernetes/infrastructure/platform/logging/logging-config/app/logging.yaml index b8997e54..57fcdbb1 100644 --- a/cluster-talos/kubernetes/infrastructure/platform/logging/logging-config/app/logging.yaml +++ b/cluster-talos/kubernetes/infrastructure/platform/logging/logging-config/app/logging.yaml @@ -65,6 +65,9 @@ spec: # File-buffer on a small PVC per replica — survives pod restart, # absorbs vcflogs back-pressure. PVC size chosen to hold ~1h of # peak log volume (LogVerbose=1 on prod plex can push 200MB/h). + # storageClassName omitted on purpose → cluster default (vsan, + # vSphere CSI). Longhorn was removed earlier; vsan handles + # ReadWriteOnce + WaitForFirstConsumer just fine.
bufferStorageVolume: pvc: spec: @@ -72,9 +75,6 @@ spec: resources: requests: storage: 5Gi - # k8s-talos default StorageClass is longhorn — change here - # if/when we migrate (memory: longhorn removal planned). - storageClassName: longhorn # Tolerate all nodes so the aggregator can land anywhere if # capacity tightens. tolerations: