Jelajahi Sumber

pod optimization and advanced settings

duhow 1 tahun lalu
induk
melakukan
18463d935e

+ 4 - 0
kubernetes/helm/templates/_helpers.tpl

@@ -6,6 +6,10 @@
 ollama
 {{- end -}}
 
+{{- define "ollama.url" -}}
+{{- printf "http://%s.%s.svc.cluster.local:%d/api" (include "ollama.name" .) (.Release.Namespace) (.Values.ollama.service.port | int) }}
+{{- end }}
+
 {{- define "chart.name" -}}
 {{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" }}
 {{- end }}

+ 5 - 0
kubernetes/helm/templates/ollama-statefulset.yaml

@@ -23,6 +23,11 @@ spec:
         {{- toYaml . | nindent 8 }}
       {{- end }}
     spec:
+      enableServiceLinks: false
+      automountServiceAccountToken: false
+      {{- with .Values.ollama.runtimeClassName }}
+      runtimeClassName: {{ . }}
+      {{- end }}
       containers:
       - name: {{ include "ollama.name" . }}
         {{- with .Values.ollama.image }}

+ 3 - 1
kubernetes/helm/templates/webui-deployment.yaml

@@ -22,6 +22,8 @@ spec:
         {{- toYaml . | nindent 8 }}
       {{- end }}
     spec:
+      enableServiceLinks: false
+      automountServiceAccountToken: false
       containers:
       - name: {{ .Chart.Name }}
         {{- with .Values.webui.image }}
@@ -39,7 +41,7 @@ spec:
           mountPath: /app/backend/data
         env:
         - name: OLLAMA_API_BASE_URL
-          value: {{ printf "http://%s.%s.svc.cluster.local:%s/api" (include "ollama.name" .) (.Release.Namespace) (.Values.ollama.servicePort) | quote }}
+          value: {{ include "ollama.url" . | quote }}
         tty: true
       {{- with .Values.webui.nodeSelector }}
       nodeSelector:

+ 1 - 1
kubernetes/helm/templates/webui-ingress.yaml

@@ -20,5 +20,5 @@ spec:
           service:
             name: {{ include "open-webui.name" . }}
             port:
-              number: {{ .Values.webui.service.port }}
+              name: http
 {{- end }}

+ 4 - 0
kubernetes/helm/values.yaml

@@ -1,3 +1,5 @@
+nameOverride: ""
+
 ollama:
   annotations: {}
   podAnnotations: {}
@@ -16,6 +18,8 @@ ollama:
     selector: {}
     annotations: {}
   nodeSelector: {}
+  # -- If using a special runtime container such as nvidia, set it here.
+  runtimeClassName: ""
   tolerations:
   - key: nvidia.com/gpu
     operator: Exists