gpu.yaml 1.0 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556
  1. ---
  2. apiVersion: v1
  3. kind: Namespace
  4. metadata:
  5. name: ollama
  6. ---
  7. apiVersion: apps/v1
  8. kind: Deployment
  9. metadata:
  10. name: ollama
  11. namespace: ollama
  12. spec:
  13. strategy:
  14. type: Recreate
  15. selector:
  16. matchLabels:
  17. name: ollama
  18. template:
  19. metadata:
  20. labels:
  21. name: ollama
  22. spec:
  23. containers:
  24. - name: ollama
  25. image: ollama/ollama:latest
  26. env:
  27. - name: PATH
  28. value: /usr/local/nvidia/bin:/usr/local/nvidia/lib64:/usr/bin:/usr/sbin:/bin:/sbin
  29. - name: LD_LIBRARY_PATH
  30. value: /usr/local/nvidia/lib64
  31. ports:
  32. - name: http
  33. containerPort: 11434
  34. protocol: TCP
  35. resources:
  36. limits:
  37. nvidia.com/gpu: 1
  38. tolerations:
  39. - key: nvidia.com/gpu
  40. operator: Exists
  41. effect: NoSchedule
  42. ---
  43. apiVersion: v1
  44. kind: Service
  45. metadata:
  46. name: ollama
  47. namespace: ollama
  48. spec:
  49. type: ClusterIP
  50. selector:
  51. name: ollama
  52. ports:
  53. - port: 80
  54. name: http
  55. targetPort: http
  56. protocol: TCP