server.go 5.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241
  1. // Package registry implements an Ollama registry client and server.
  2. package registry
import (
	"bytes"
	"cmp"
	"context"
	"errors"
	"log"
	"net/http"
	"net/url"
	"path"
	"slices"
	"strconv"
	"strings"
	"time"

	"github.com/minio/minio-go/v7"
	"github.com/minio/minio-go/v7/pkg/credentials"
	"github.com/ollama/ollama/x/client/ollama"
	"github.com/ollama/ollama/x/model"
	"github.com/ollama/ollama/x/oweb"
	"github.com/ollama/ollama/x/registry/apitype"
	"github.com/ollama/ollama/x/utils/upload"
)
  22. // Defaults
  23. const (
  24. DefaultUploadChunkSize = 50 * 1024 * 1024
  25. )
  26. type Server struct {
  27. UploadChunkSize int64 // default is DefaultUploadChunkSize
  28. S3Client *minio.Client
  29. }
  30. func (s *Server) ServeHTTP(w http.ResponseWriter, r *http.Request) {
  31. if err := s.serveHTTP(w, r); err != nil {
  32. log.Printf("error: %v", err) // TODO(bmizerany): take a slog.Logger
  33. var e *ollama.Error
  34. if !errors.As(err, &e) {
  35. e = oweb.ErrInternal
  36. }
  37. w.WriteHeader(cmp.Or(e.Status, 400))
  38. if err := oweb.EncodeJSON(w, e); err != nil {
  39. log.Printf("error encoding error: %v", err)
  40. }
  41. }
  42. }
  43. func (s *Server) serveHTTP(w http.ResponseWriter, r *http.Request) error {
  44. switch r.URL.Path {
  45. case "/v1/push":
  46. return s.handlePush(w, r)
  47. case "/v1/pull":
  48. return s.handlePull(w, r)
  49. default:
  50. return oweb.ErrNotFound
  51. }
  52. }
  53. func (s *Server) uploadChunkSize() int64 {
  54. return cmp.Or(s.UploadChunkSize, DefaultUploadChunkSize)
  55. }
  56. func (s *Server) handlePush(w http.ResponseWriter, r *http.Request) error {
  57. const bucketTODO = "test"
  58. const minimumMultipartSize = 5 * 1024 * 1024 // S3 spec
  59. pr, err := oweb.DecodeUserJSON[apitype.PushRequest]("", r.Body)
  60. if err != nil {
  61. return err
  62. }
  63. mp := model.ParseName(pr.Name)
  64. if !mp.IsComplete() {
  65. return oweb.Invalid("name", pr.Name, "must be complete")
  66. }
  67. m, err := oweb.DecodeUserJSON[apitype.Manifest]("manifest", bytes.NewReader(pr.Manifest))
  68. if err != nil {
  69. return err
  70. }
  71. mcc := &minio.Core{Client: s.s3()}
  72. // TODO(bmizerany): complete uploads before stats for any with ETag
  73. type completeParts struct {
  74. key string
  75. parts []minio.CompletePart
  76. }
  77. completePartsByUploadID := make(map[string]completeParts)
  78. for _, mcp := range pr.CompleteParts {
  79. // parse the URL
  80. u, err := url.Parse(mcp.URL)
  81. if err != nil {
  82. return err
  83. }
  84. q := u.Query()
  85. // Check if this is a part upload, if not, skip
  86. uploadID := q.Get("uploadId")
  87. if uploadID == "" {
  88. // not a part upload
  89. continue
  90. }
  91. // PartNumber is required
  92. queryPartNumber := q.Get("partNumber")
  93. partNumber, err := strconv.Atoi(queryPartNumber)
  94. if err != nil {
  95. return oweb.Invalid("partNumber", queryPartNumber, "invalid or missing PartNumber")
  96. }
  97. // ETag is required
  98. if mcp.ETag == "" {
  99. return oweb.Missing("etag")
  100. }
  101. cp := completePartsByUploadID[uploadID]
  102. cp.key = u.Path
  103. cp.parts = append(cp.parts, minio.CompletePart{
  104. PartNumber: partNumber,
  105. ETag: mcp.ETag,
  106. })
  107. completePartsByUploadID[uploadID] = cp
  108. }
  109. for uploadID, cp := range completePartsByUploadID {
  110. var zeroOpts minio.PutObjectOptions
  111. _, err := mcc.CompleteMultipartUpload(r.Context(), bucketTODO, cp.key, uploadID, cp.parts, zeroOpts)
  112. if err != nil {
  113. var e minio.ErrorResponse
  114. if errors.As(err, &e) && e.Code == "NoSuchUpload" {
  115. return oweb.Invalid("uploadId", uploadID, "")
  116. }
  117. return err
  118. }
  119. }
  120. var requirements []apitype.Requirement
  121. for _, l := range m.Layers {
  122. // TODO(bmizerany): do in parallel
  123. if l.Size == 0 {
  124. continue
  125. }
  126. // TODO(bmizerany): "global" throttle of rate of transfer
  127. pushed, err := s.statObject(r.Context(), l.Digest)
  128. if err != nil {
  129. return err
  130. }
  131. if !pushed {
  132. key := path.Join("blobs", l.Digest)
  133. if l.Size < minimumMultipartSize {
  134. // single part upload
  135. signedURL, err := s.s3().PresignedPutObject(r.Context(), bucketTODO, key, 15*time.Minute)
  136. if err != nil {
  137. return err
  138. }
  139. requirements = append(requirements, apitype.Requirement{
  140. Digest: l.Digest,
  141. Size: l.Size,
  142. URL: signedURL.String(),
  143. })
  144. } else {
  145. uploadID, err := mcc.NewMultipartUpload(r.Context(), bucketTODO, key, minio.PutObjectOptions{})
  146. if err != nil {
  147. return err
  148. }
  149. for partNumber, c := range upload.Chunks(l.Size, s.uploadChunkSize()) {
  150. const timeToStartUpload = 15 * time.Minute
  151. signedURL, err := s.s3().Presign(r.Context(), "PUT", bucketTODO, key, timeToStartUpload, url.Values{
  152. "uploadId": []string{uploadID},
  153. "partNumber": []string{strconv.Itoa(partNumber)},
  154. })
  155. if err != nil {
  156. return err
  157. }
  158. requirements = append(requirements, apitype.Requirement{
  159. Digest: l.Digest,
  160. Offset: c.Offset,
  161. Size: c.N,
  162. URL: signedURL.String(),
  163. })
  164. }
  165. }
  166. }
  167. }
  168. if len(requirements) == 0 {
  169. // Commit the manifest
  170. body := bytes.NewReader(pr.Manifest)
  171. path := path.Join("manifests", path.Join(mp.Parts()...))
  172. _, err := s.s3().PutObject(r.Context(), bucketTODO, path, body, int64(len(pr.Manifest)), minio.PutObjectOptions{})
  173. if err != nil {
  174. return err
  175. }
  176. }
  177. return oweb.EncodeJSON(w, &apitype.PushResponse{Requirements: requirements})
  178. }
  179. func (s *Server) handlePull(w http.ResponseWriter, r *http.Request) error {
  180. // lookup manifest
  181. panic("TODO")
  182. }
  183. func (s *Server) statObject(ctx context.Context, digest string) (pushed bool, err error) {
  184. // HEAD the object
  185. path := path.Join("blobs", digest)
  186. _, err = s.s3().StatObject(ctx, "test", path, minio.StatObjectOptions{})
  187. if err != nil {
  188. if isNoSuchKey(err) {
  189. err = nil
  190. }
  191. return false, err
  192. }
  193. return true, nil
  194. }
  195. func isNoSuchKey(err error) bool {
  196. var e minio.ErrorResponse
  197. return errors.As(err, &e) && e.Code == "NoSuchKey"
  198. }
  199. func (s *Server) s3() *minio.Client {
  200. if s.S3Client != nil {
  201. return s.S3Client
  202. }
  203. s3, err := minio.New("localhost:9000", &minio.Options{
  204. Creds: credentials.NewStaticV4("minioadmin", "minioadmin", ""),
  205. Secure: false,
  206. })
  207. if err != nil {
  208. panic(err)
  209. }
  210. return s3
  211. }