Compare commits

...

10 Commits

2 changed files with 48 additions and 9 deletions

View File

@@ -1,15 +1,35 @@
# Helm values for the Ollama chart (indentation reconstructed — the paste had
# flattened every line to column 0, which is not valid YAML).
service:
  type: ClusterIP
# Enable GPU support
ollama:
  gpu:
    enabled: true
    type: nvidia
    number: 1
resources:
  requests:
    cpu: 250m
    memory: 1Gi
  # NOTE(review): removed an earlier duplicate `limits:` block (cpu: 2 /
  # memory: 4Gi). Duplicate mapping keys are invalid YAML and most parsers
  # silently keep only the last value, so only this block ever took effect.
  limits:
    cpu: 4
    memory: 8Gi
# Schedule on GPU worker node
nodeSelector:
  kubernetes.io/hostname: k3s-worker-5-gpu
# Tolerate GPU node taint
tolerations:
  - key: gpu
    operator: Exists
    effect: NoSchedule
  - key: nvidia.com/gpu
    operator: Exists
    effect: NoSchedule
persistentVolume:
  enabled: true
  # NOTE(review): removed earlier duplicate `size: 30Gi` /
  # `storageClass: nfs-client` lines that were shadowed by these later values.
  size: 50Gi
  storageClass: local-path

View File

@@ -1,16 +1,17 @@
# Helm values for the Open WebUI chart (indentation reconstructed — the paste
# had flattened every line to column 0, which is not valid YAML).
service:
  type: ClusterIP
# NOTE(review): this env entry points at a different Ollama endpoint
# (namespace-qualified FQDN) than the extraEnvVars below (bare service name,
# same-namespace only). Confirm which key this chart actually consumes and
# drop the stale one — as written, two conflicting endpoints are configured.
env:
  - name: OLLAMA_BASE_URL
    value: http://ollama.ai-stack.svc.cluster.local:11434
# IMPORTANT: disable the embedded Ollama that the chart can deploy
ollama:
  enabled: false
# IMPORTANT: set BOTH vars to your existing Ollama service
extraEnvVars:
  - name: OLLAMA_BASE_URL
    value: http://ollama:11434
  - name: OLLAMA_BASE_URLS
    value: http://ollama:11434
resources:
  requests:
    cpu: 100m
@@ -18,3 +19,21 @@ resources:
# (continuation of the `resources:` block from the previous hunk — see the
# hunk header above; indentation reconstructed from the flattened paste)
  limits:
    cpu: 500m
    memory: 1Gi
persistence:
  enabled: true
  storageClass: local-path
  size: 2Gi
# Schedule on GPU worker node (same as Ollama for low latency)
nodeSelector:
  kubernetes.io/hostname: k3s-worker-5-gpu
# Tolerate GPU node taint
tolerations:
  - key: gpu
    operator: Exists
    effect: NoSchedule
  - key: nvidia.com/gpu
    operator: Exists
    effect: NoSchedule