model.go 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255
  1. package server
  2. import (
  3. "archive/zip"
  4. "bytes"
  5. "context"
  6. "errors"
  7. "fmt"
  8. "io"
  9. "net/http"
  10. "os"
  11. "path/filepath"
  12. "github.com/ollama/ollama/api"
  13. "github.com/ollama/ollama/convert"
  14. "github.com/ollama/ollama/llm"
  15. "github.com/ollama/ollama/types/model"
  16. )
  17. var intermediateBlobs map[string]string = make(map[string]string)
  18. type layerWithGGML struct {
  19. *Layer
  20. *llm.GGML
  21. }
  22. func parseFromModel(ctx context.Context, name model.Name, fn func(api.ProgressResponse)) (layers []*layerWithGGML, err error) {
  23. modelpath := ParseModelPath(name.String())
  24. manifest, _, err := GetManifest(modelpath)
  25. switch {
  26. case errors.Is(err, os.ErrNotExist):
  27. if err := PullModel(ctx, name.String(), &registryOptions{}, fn); err != nil {
  28. return nil, err
  29. }
  30. modelpath = ParseModelPath(name.String())
  31. manifest, _, err = GetManifest(modelpath)
  32. if err != nil {
  33. return nil, err
  34. }
  35. case err != nil:
  36. return nil, err
  37. }
  38. for _, layer := range manifest.Layers {
  39. layer, err := NewLayerFromLayer(layer.Digest, layer.MediaType, modelpath.GetShortTagname())
  40. if err != nil {
  41. return nil, err
  42. }
  43. switch layer.MediaType {
  44. case "application/vnd.ollama.image.model",
  45. "application/vnd.ollama.image.projector",
  46. "application/vnd.ollama.image.adapter":
  47. blobpath, err := GetBlobsPath(layer.Digest)
  48. if err != nil {
  49. return nil, err
  50. }
  51. blob, err := os.Open(blobpath)
  52. if err != nil {
  53. return nil, err
  54. }
  55. defer blob.Close()
  56. ggml, _, err := llm.DecodeGGML(blob)
  57. if err != nil {
  58. return nil, err
  59. }
  60. layers = append(layers, &layerWithGGML{layer, ggml})
  61. default:
  62. layers = append(layers, &layerWithGGML{layer, nil})
  63. }
  64. }
  65. return layers, nil
  66. }
  67. func parseFromZipFile(_ context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerWithGGML, err error) {
  68. stat, err := file.Stat()
  69. if err != nil {
  70. return nil, err
  71. }
  72. r, err := zip.NewReader(file, stat.Size())
  73. if err != nil {
  74. return nil, err
  75. }
  76. tempdir, err := os.MkdirTemp(filepath.Dir(file.Name()), "")
  77. if err != nil {
  78. return nil, err
  79. }
  80. defer os.RemoveAll(tempdir)
  81. fn(api.ProgressResponse{Status: "unpacking model metadata"})
  82. for _, f := range r.File {
  83. // TODO(mxyng): this should not write out all files to disk
  84. outfile, err := os.Create(filepath.Join(tempdir, f.Name))
  85. if err != nil {
  86. return nil, err
  87. }
  88. defer outfile.Close()
  89. infile, err := f.Open()
  90. if err != nil {
  91. return nil, err
  92. }
  93. defer infile.Close()
  94. if _, err = io.Copy(outfile, infile); err != nil {
  95. return nil, err
  96. }
  97. if err := outfile.Close(); err != nil {
  98. return nil, err
  99. }
  100. if err := infile.Close(); err != nil {
  101. return nil, err
  102. }
  103. }
  104. mf, err := convert.GetModelFormat(tempdir)
  105. if err != nil {
  106. return nil, err
  107. }
  108. params, err := mf.GetParams(tempdir)
  109. if err != nil {
  110. return nil, err
  111. }
  112. mArch, err := mf.GetModelArch("", tempdir, params)
  113. if err != nil {
  114. return nil, err
  115. }
  116. fn(api.ProgressResponse{Status: "processing tensors"})
  117. if err := mArch.GetTensors(); err != nil {
  118. return nil, err
  119. }
  120. if err := mArch.LoadVocab(); err != nil {
  121. return nil, err
  122. }
  123. fn(api.ProgressResponse{Status: "converting model"})
  124. // TODO(mxyng): this should write directly into a layer
  125. // e.g. NewLayer(arch.Reader(), "application/vnd.ollama.image.model")
  126. temp, err := os.CreateTemp(tempdir, "fp16")
  127. if err != nil {
  128. return nil, err
  129. }
  130. defer temp.Close()
  131. defer os.Remove(temp.Name())
  132. if err = mArch.WriteGGUF(temp); err != nil {
  133. return nil, err
  134. }
  135. if _, err := temp.Seek(0, io.SeekStart); err != nil {
  136. return nil, err
  137. }
  138. layer, err := NewLayer(temp, "application/vnd.ollama.image.model")
  139. if err != nil {
  140. return nil, err
  141. }
  142. bin, err := layer.Open()
  143. if err != nil {
  144. return nil, err
  145. }
  146. defer bin.Close()
  147. ggml, _, err := llm.DecodeGGML(bin)
  148. if err != nil {
  149. return nil, err
  150. }
  151. layers = append(layers, &layerWithGGML{layer, ggml})
  152. intermediateBlobs[digest] = layer.Digest
  153. return layers, nil
  154. }
  155. func parseFromFile(ctx context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerWithGGML, err error) {
  156. sr := io.NewSectionReader(file, 0, 512)
  157. contentType, err := detectContentType(sr)
  158. if err != nil {
  159. return nil, err
  160. }
  161. switch contentType {
  162. case "gguf", "ggla":
  163. // noop
  164. case "application/zip":
  165. return parseFromZipFile(ctx, file, digest, fn)
  166. default:
  167. return nil, fmt.Errorf("unsupported content type: %s", contentType)
  168. }
  169. stat, err := file.Stat()
  170. if err != nil {
  171. return nil, err
  172. }
  173. var offset int64
  174. for offset < stat.Size() {
  175. ggml, n, err := llm.DecodeGGML(file)
  176. if errors.Is(err, io.EOF) {
  177. break
  178. } else if err != nil {
  179. return nil, err
  180. }
  181. mediatype := "application/vnd.ollama.image.model"
  182. if ggml.Name() == "ggla" {
  183. mediatype = "application/vnd.ollama.image.adapter"
  184. } else if ggml.KV().Architecture() == "clip" {
  185. mediatype = "application/vnd.ollama.image.projector"
  186. }
  187. layer, err := NewLayer(io.NewSectionReader(file, offset, n), mediatype)
  188. if err != nil {
  189. return nil, err
  190. }
  191. layers = append(layers, &layerWithGGML{layer, ggml})
  192. offset = n
  193. }
  194. return layers, nil
  195. }
  196. func detectContentType(r io.Reader) (string, error) {
  197. var b bytes.Buffer
  198. if _, err := io.Copy(&b, r); err != nil {
  199. return "", err
  200. }
  201. if contentType := llm.DetectGGMLType(b.Bytes()); contentType != "" {
  202. return contentType, nil
  203. }
  204. if contentType := http.DetectContentType(b.Bytes()); contentType != "application/octet-stream" {
  205. return contentType, nil
  206. }
  207. return "unknown", nil
  208. }