# Ollama on Kubernetes: Namespace, GPU-backed Deployment, and ClusterIP Service.
---
# Dedicated namespace that holds every Ollama resource in this manifest.
apiVersion: v1
kind: Namespace
metadata:
  name: ollama
---
# Runs the Ollama server as a single GPU-backed pod in the `ollama` namespace.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: ollama
  namespace: ollama
spec:
  # Recreate terminates the old pod before the new one is created.
  # NOTE(review): presumably chosen so a rollout is not blocked waiting for
  # the GPU still held by the outgoing pod - confirm.
  strategy:
    type: Recreate
  selector:
    matchLabels:
      name: ollama
  template:
    metadata:
      labels:
        # Must match spec.selector.matchLabels and the Service selector.
        name: ollama
    spec:
      containers:
        - name: ollama
          # NOTE(review): `latest` is a floating tag; pin a specific version
          # for reproducible rollouts.
          image: ollama/ollama:latest
          env:
            # Put the NVIDIA/CUDA binaries ahead of the standard system paths.
            - name: PATH
              value: /usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
            # Let the dynamic linker find the NVIDIA driver libraries.
            - name: LD_LIBRARY_PATH
              value: /usr/local/nvidia/lib:/usr/local/nvidia/lib64
            # Driver capabilities requested from the NVIDIA container runtime.
            - name: NVIDIA_DRIVER_CAPABILITIES
              value: compute,utility
          ports:
            # Named port; the Service targets it by name (`targetPort: http`).
            - name: http
              containerPort: 11434
              protocol: TCP
          # Keep the pod out of the Service endpoints until the server is
          # accepting connections on the `http` port.
          readinessProbe:
            tcpSocket:
              port: http
            initialDelaySeconds: 5
            periodSeconds: 10
          resources:
            limits:
              # Request one whole GPU via the NVIDIA device plugin resource.
              nvidia.com/gpu: 1
      # Allow scheduling onto nodes tainted `nvidia.com/gpu:NoSchedule`.
      tolerations:
        - key: nvidia.com/gpu
          operator: Exists
          effect: NoSchedule
---
# Cluster-internal Service exposing the Ollama pod on port 80.
apiVersion: v1
kind: Service
metadata:
  name: ollama
  namespace: ollama
spec:
  type: ClusterIP
  # Selects pods carrying the label set in the Deployment's pod template.
  selector:
    name: ollama
  ports:
    # Port 80 on the Service forwards to the container port named `http`.
    - port: 80
      name: http
      targetPort: http
      protocol: TCP