diff --git a/manifests/ollama/values.yaml b/manifests/ollama/values.yaml
index 1b5eb59..0309e4a 100644
--- a/manifests/ollama/values.yaml
+++ b/manifests/ollama/values.yaml
@@ -20,6 +20,13 @@ resources:
 nodeSelector:
   kubernetes.io/hostname: k3s-worker-5-gpu
 
+# Tolerate GPU node taint
+tolerations:
+  - key: gpu
+    operator: Equal
+    value: "true"
+    effect: NoSchedule
+
 persistentVolume:
   enabled: true
   size: 30Gi
diff --git a/manifests/open-webui/values.yaml b/manifests/open-webui/values.yaml
index 1f64395..a2b595f 100644
--- a/manifests/open-webui/values.yaml
+++ b/manifests/open-webui/values.yaml
@@ -23,3 +23,10 @@ resources:
 # Schedule on GPU worker node (same as Ollama for low latency)
 nodeSelector:
   kubernetes.io/hostname: k3s-worker-5-gpu
+
+# Tolerate GPU node taint
+tolerations:
+  - key: gpu
+    operator: Equal
+    value: "true"
+    effect: NoSchedule