Add tolerations so the apps can be scheduled on the tainted GPU worker node

This commit is contained in:
dvirlabs 2026-03-02 03:43:35 +02:00
parent f2ee04efc4
commit 4ab43ca043
2 changed files with 14 additions and 0 deletions

View File

@@ -20,6 +20,13 @@ resources:
nodeSelector:
kubernetes.io/hostname: k3s-worker-5-gpu
# Tolerate GPU node taint
tolerations:
- key: gpu
operator: Equal
value: "true"
effect: NoSchedule
persistentVolume:
enabled: true
size: 30Gi

View File

@@ -23,3 +23,10 @@ resources:
# Schedule on GPU worker node (same as Ollama for low latency)
nodeSelector:
kubernetes.io/hostname: k3s-worker-5-gpu
# Tolerate GPU node taint
tolerations:
- key: gpu
operator: Equal
value: "true"
effect: NoSchedule