Compare commits

...

10 Commits

2 changed files with 48 additions and 9 deletions

View File

@@ -1,15 +1,35 @@
 service:
   type: ClusterIP
+# Enable GPU support
+ollama:
+  gpu:
+    enabled: true
+    type: nvidia
+    number: 1
 resources:
   requests:
+    cpu: 250m
+    memory: 1Gi
+  limits:
     cpu: 2
     memory: 4Gi
-  limits:
-    cpu: 4
-    memory: 8Gi
+# Schedule on GPU worker node
+nodeSelector:
+  kubernetes.io/hostname: k3s-worker-5-gpu
+# Tolerate GPU node taint
+tolerations:
+  - key: gpu
+    operator: Exists
+    effect: NoSchedule
+  - key: nvidia.com/gpu
+    operator: Exists
+    effect: NoSchedule
 persistentVolume:
   enabled: true
-  size: 30Gi
-  storageClass: nfs-client
+  size: 50Gi
+  storageClass: local-path

View File

@@ -1,10 +1,11 @@
 service:
   type: ClusterIP
-env:
-  - name: OLLAMA_BASE_URL
-    value: http://ollama.ai-stack.svc.cluster.local:11434
+# IMPORTANT: disable the embedded Ollama that the chart can deploy
+ollama:
+  enabled: false
+# IMPORTANT: set BOTH vars to your existing Ollama service
 extraEnvVars:
   - name: OLLAMA_BASE_URL
     value: http://ollama:11434
@@ -18,3 +19,21 @@ resources:
   limits:
     cpu: 500m
     memory: 1Gi
+persistence:
+  enabled: true
+  storageClass: local-path
+  size: 2Gi
+# Schedule on GPU worker node (same as Ollama for low latency)
+nodeSelector:
+  kubernetes.io/hostname: k3s-worker-5-gpu
+# Tolerate GPU node taint
+tolerations:
+  - key: gpu
+    operator: Exists
+    effect: NoSchedule
+  - key: nvidia.com/gpu
+    operator: Exists
+    effect: NoSchedule