Add node selector to make sure the apps run on the GPU worker
This commit is contained in:
parent
3a0c78d5de
commit
098ce3bbc4
@ -1,6 +1,13 @@
|
|||||||
service:
|
service:
|
||||||
type: ClusterIP
|
type: ClusterIP
|
||||||
|
|
||||||
|
# Enable GPU support
|
||||||
|
ollama:
|
||||||
|
gpu:
|
||||||
|
enabled: true
|
||||||
|
type: nvidia
|
||||||
|
number: 1
|
||||||
|
|
||||||
resources:
|
resources:
|
||||||
requests:
|
requests:
|
||||||
cpu: 2
|
cpu: 2
|
||||||
@ -9,6 +16,10 @@ resources:
|
|||||||
cpu: 4
|
cpu: 4
|
||||||
memory: 8Gi
|
memory: 8Gi
|
||||||
|
|
||||||
|
# Schedule on GPU worker node
|
||||||
|
nodeSelector:
|
||||||
|
kubernetes.io/hostname: k3s-worker-5-gpu
|
||||||
|
|
||||||
persistentVolume:
|
persistentVolume:
|
||||||
enabled: true
|
enabled: true
|
||||||
size: 30Gi
|
size: 30Gi
|
||||||
|
|||||||
@ -19,3 +19,7 @@ resources:
|
|||||||
limits:
|
limits:
|
||||||
cpu: 500m
|
cpu: 500m
|
||||||
memory: 1Gi
|
memory: 1Gi
|
||||||
|
|
||||||
|
# Schedule on GPU worker node (same as Ollama for low latency)
|
||||||
|
nodeSelector:
|
||||||
|
kubernetes.io/hostname: k3s-worker-5-gpu
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user