gpu.yaml 1.1 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758
  1. ---
  2. apiVersion: v1
  3. kind: Namespace
  4. metadata:
  5. name: ollama
  6. ---
  7. apiVersion: apps/v1
  8. kind: Deployment
  9. metadata:
  10. name: ollama
  11. namespace: ollama
  12. spec:
  13. strategy:
  14. type: Recreate
  15. selector:
  16. matchLabels:
  17. name: ollama
  18. template:
  19. metadata:
  20. labels:
  21. name: ollama
  22. spec:
  23. containers:
  24. - name: ollama
  25. image: ollama/ollama:latest
  26. env:
  27. - name: PATH
  28. value: /usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
  29. - name: LD_LIBRARY_PATH
  30. value: /usr/local/nvidia/lib:/usr/local/nvidia/lib64
  31. - name: NVIDIA_DRIVER_CAPABILITIES
  32. value: compute,utility
  33. ports:
  34. - name: http
  35. containerPort: 11434
  36. protocol: TCP
  37. resources:
  38. limits:
  39. nvidia.com/gpu: 1
  40. tolerations:
  41. - key: nvidia.com/gpu
  42. operator: Exists
  43. effect: NoSchedule
  44. ---
  45. apiVersion: v1
  46. kind: Service
  47. metadata:
  48. name: ollama
  49. namespace: ollama
  50. spec:
  51. type: ClusterIP
  52. selector:
  53. name: ollama
  54. ports:
  55. - port: 80
  56. name: http
  57. targetPort: http
  58. protocol: TCP