Add node selector to make sure the apps run on the GPU worker

This commit is contained in:
dvirlabs 2026-03-02 03:39:35 +02:00
parent 3a0c78d5de
commit 098ce3bbc4
2 changed files with 15 additions and 0 deletions

View File

@ -1,6 +1,13 @@
service: service:
type: ClusterIP type: ClusterIP
# Enable GPU support
ollama:
gpu:
enabled: true
type: nvidia
number: 1
resources: resources:
requests: requests:
cpu: 2 cpu: 2
@ -9,6 +16,10 @@ resources:
cpu: 4 cpu: 4
memory: 8Gi memory: 8Gi
# Schedule on GPU worker node
nodeSelector:
kubernetes.io/hostname: k3s-worker-5-gpu
persistentVolume: persistentVolume:
enabled: true enabled: true
size: 30Gi size: 30Gi

View File

@ -19,3 +19,7 @@ resources:
limits: limits:
cpu: 500m cpu: 500m
memory: 1Gi memory: 1Gi
# Schedule on GPU worker node (same as Ollama for low latency)
nodeSelector:
kubernetes.io/hostname: k3s-worker-5-gpu