Add tolerations so the apps can be scheduled on the tainted GPU worker

2026-03-02 03:43:35 +02:00 · 2026-03-02 03:43:35 +02:00 · 4ab43ca043
commit 4ab43ca043
parent f2ee04efc4
2 changed files with 14 additions and 0 deletions
--- a/manifests/ollama/values.yaml
+++ b/manifests/ollama/values.yaml
@@ -20,6 +20,13 @@ resources:
 nodeSelector:
  kubernetes.io/hostname: k3s-worker-5-gpu

+# Tolerate GPU node taint
+tolerations:
+  - key: gpu
+    operator: Equal
+    value: "true"
+    effect: NoSchedule
+
 persistentVolume:
  enabled: true
  size: 30Gi
--- a/manifests/open-webui/values.yaml
+++ b/manifests/open-webui/values.yaml
@@ -23,3 +23,10 @@ resources:
 # Schedule on GPU worker node (same as Ollama for low latency)
 nodeSelector:
  kubernetes.io/hostname: k3s-worker-5-gpu
+
+# Tolerate GPU node taint
+tolerations:
+  - key: gpu
+    operator: Equal
+    value: "true"
+    effect: NoSchedule