model.go 5.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258
  1. package server
  2. import (
  3. "archive/zip"
  4. "bytes"
  5. "context"
  6. "errors"
  7. "fmt"
  8. "io"
  9. "net/http"
  10. "os"
  11. "path/filepath"
  12. "github.com/ollama/ollama/api"
  13. "github.com/ollama/ollama/convert"
  14. "github.com/ollama/ollama/llm"
  15. "github.com/ollama/ollama/types/model"
  16. "github.com/ollama/ollama/types/ordered"
  17. )
  18. func parseFromModel(ctx context.Context, name model.Name, fn func(api.ProgressResponse)) (*ordered.Map[*Layer, *llm.GGML], error) {
  19. modelpath := ParseModelPath(name.DisplayLongest())
  20. manifest, _, err := GetManifest(modelpath)
  21. switch {
  22. case errors.Is(err, os.ErrNotExist):
  23. if err := PullModel(ctx, name.DisplayLongest(), &registryOptions{}, fn); err != nil {
  24. return nil, err
  25. }
  26. modelpath = ParseModelPath(name.DisplayLongest())
  27. manifest, _, err = GetManifest(modelpath)
  28. if err != nil {
  29. return nil, err
  30. }
  31. case err != nil:
  32. return nil, err
  33. }
  34. layers := ordered.NewMap[*Layer, *llm.GGML]()
  35. for _, layer := range manifest.Layers {
  36. layer, err := NewLayerFromLayer(layer.Digest, layer.MediaType, modelpath.GetShortTagname())
  37. if err != nil {
  38. return nil, err
  39. }
  40. switch layer.MediaType {
  41. case "application/vnd.ollama.image.model",
  42. "application/vnd.ollama.image.projector",
  43. "application/vnd.ollama.image.adapter":
  44. blobpath, err := GetBlobsPath(layer.Digest)
  45. if err != nil {
  46. return nil, err
  47. }
  48. blob, err := os.Open(blobpath)
  49. if err != nil {
  50. return nil, err
  51. }
  52. defer blob.Close()
  53. ggml, _, err := llm.DecodeGGML(blob)
  54. if err != nil {
  55. return nil, err
  56. }
  57. layers.Add(layer, ggml)
  58. default:
  59. layers.Add(layer, nil)
  60. }
  61. }
  62. return layers, nil
  63. }
  64. func parseFromZipFile(_ context.Context, file *os.File, fn func(api.ProgressResponse)) (*ordered.Map[*Layer, *llm.GGML], error) {
  65. stat, err := file.Stat()
  66. if err != nil {
  67. return nil, err
  68. }
  69. r, err := zip.NewReader(file, stat.Size())
  70. if err != nil {
  71. return nil, err
  72. }
  73. tempdir, err := os.MkdirTemp(filepath.Dir(file.Name()), "")
  74. if err != nil {
  75. return nil, err
  76. }
  77. defer os.RemoveAll(tempdir)
  78. fn(api.ProgressResponse{Status: "unpacking model metadata"})
  79. for _, f := range r.File {
  80. // TODO(mxyng): this should not write out all files to disk
  81. outfile, err := os.Create(filepath.Join(tempdir, f.Name))
  82. if err != nil {
  83. return nil, err
  84. }
  85. infile, err := f.Open()
  86. if err != nil {
  87. return nil, err
  88. }
  89. if _, err = io.Copy(outfile, infile); err != nil {
  90. return nil, err
  91. }
  92. if err := outfile.Close(); err != nil {
  93. return nil, err
  94. }
  95. if err := infile.Close(); err != nil {
  96. return nil, err
  97. }
  98. }
  99. mf, err := convert.GetModelFormat(tempdir)
  100. if err != nil {
  101. return nil, err
  102. }
  103. params, err := mf.GetParams(tempdir)
  104. if err != nil {
  105. return nil, err
  106. }
  107. mArch, err := mf.GetModelArch("", tempdir, params)
  108. if err != nil {
  109. return nil, err
  110. }
  111. fn(api.ProgressResponse{Status: "processing tensors"})
  112. if err := mArch.GetTensors(); err != nil {
  113. return nil, err
  114. }
  115. if err := mArch.LoadVocab(); err != nil {
  116. return nil, err
  117. }
  118. fn(api.ProgressResponse{Status: "converting model"})
  119. // TODO(mxyng): this should write directly into a layer
  120. // e.g. NewLayer(arch.Reader(), "application/vnd.ollama.image.model")
  121. temp, err := os.CreateTemp(tempdir, "fp16")
  122. if err != nil {
  123. return nil, err
  124. }
  125. defer temp.Close()
  126. defer os.Remove(temp.Name())
  127. if err = mArch.WriteGGUF(temp); err != nil {
  128. return nil, err
  129. }
  130. if _, err := temp.Seek(0, io.SeekStart); err != nil {
  131. return nil, err
  132. }
  133. layer, err := NewLayer(temp, "application/vnd.ollama.image.model")
  134. if err != nil {
  135. return nil, fmt.Errorf("aaa: %w", err)
  136. }
  137. blobpath, err := GetBlobsPath(layer.Digest)
  138. if err != nil {
  139. return nil, err
  140. }
  141. bin, err := os.Open(blobpath)
  142. if err != nil {
  143. return nil, err
  144. }
  145. defer bin.Close()
  146. ggml, _, err := llm.DecodeGGML(bin)
  147. if err != nil {
  148. return nil, err
  149. }
  150. layer, err = NewLayerFromLayer(layer.Digest, layer.MediaType, "")
  151. if err != nil {
  152. return nil, err
  153. }
  154. layers := ordered.NewMap[*Layer, *llm.GGML]()
  155. layers.Add(layer, ggml)
  156. return layers, nil
  157. }
  158. func parseFromFile(ctx context.Context, file *os.File, fn func(api.ProgressResponse)) (*ordered.Map[*Layer, *llm.GGML], error) {
  159. sr := io.NewSectionReader(file, 0, 512)
  160. contentType, err := detectContentType(sr)
  161. if err != nil {
  162. return nil, err
  163. }
  164. switch contentType {
  165. case "gguf", "ggla":
  166. // noop
  167. case "application/zip":
  168. return parseFromZipFile(ctx, file, fn)
  169. default:
  170. return nil, fmt.Errorf("unsupported content type: %s", contentType)
  171. }
  172. layers := ordered.NewMap[*Layer, *llm.GGML]()
  173. stat, err := file.Stat()
  174. if err != nil {
  175. return nil, err
  176. }
  177. var offset int64
  178. for offset < stat.Size() {
  179. ggml, n, err := llm.DecodeGGML(file)
  180. if errors.Is(err, io.EOF) {
  181. break
  182. } else if err != nil {
  183. return nil, err
  184. }
  185. mediatype := "application/vnd.ollama.image.model"
  186. if ggml.Name() == "ggla" {
  187. mediatype = "application/vnd.ollama.image.adapter"
  188. } else if ggml.KV().Architecture() == "clip" {
  189. mediatype = "application/vnd.ollama.image.projector"
  190. }
  191. layer, err := NewLayer(io.NewSectionReader(file, offset, n), mediatype)
  192. if err != nil {
  193. return nil, err
  194. }
  195. layers.Add(layer, ggml)
  196. offset = n
  197. }
  198. return layers, nil
  199. }
  200. func detectContentType(r io.Reader) (string, error) {
  201. var b bytes.Buffer
  202. if _, err := io.Copy(&b, r); err != nil {
  203. return "", err
  204. }
  205. if contentType := llm.DetectGGMLType(b.Bytes()); contentType != "" {
  206. return contentType, nil
  207. }
  208. if contentType := http.DetectContentType(b.Bytes()); contentType != "application/octet-stream" {
  209. return contentType, nil
  210. }
  211. return "unknown", nil
  212. }