model.go 5.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252
  1. package server
  2. import (
  3. "archive/zip"
  4. "bytes"
  5. "context"
  6. "errors"
  7. "fmt"
  8. "io"
  9. "net/http"
  10. "os"
  11. "path/filepath"
  12. "github.com/ollama/ollama/api"
  13. "github.com/ollama/ollama/convert"
  14. "github.com/ollama/ollama/llm"
  15. "github.com/ollama/ollama/types/model"
  16. )
  // intermediateBlobs records, for each digest handed to parseFromZipFile, the
  // digest of the model layer that was produced by converting that archive.
  //
  // NOTE(review): this is a plain package-level map with no locking visible in
  // this file; confirm that writers and readers cannot run concurrently.
  var intermediateBlobs = make(map[string]string)
  18. type layerWithGGML struct {
  19. *Layer
  20. *llm.GGML
  21. }
  22. func parseFromModel(ctx context.Context, name model.Name, fn func(api.ProgressResponse)) (layers []*layerWithGGML, err error) {
  23. m, err := ParseNamedManifest(name)
  24. switch {
  25. case errors.Is(err, os.ErrNotExist):
  26. if err := PullModel(ctx, name.String(), &registryOptions{}, fn); err != nil {
  27. return nil, err
  28. }
  29. m, err = ParseNamedManifest(name)
  30. if err != nil {
  31. return nil, err
  32. }
  33. case err != nil:
  34. return nil, err
  35. }
  36. for _, layer := range m.Layers {
  37. layer, err := NewLayerFromLayer(layer.Digest, layer.MediaType, name.DisplayShortest())
  38. if err != nil {
  39. return nil, err
  40. }
  41. switch layer.MediaType {
  42. case "application/vnd.ollama.image.model",
  43. "application/vnd.ollama.image.projector",
  44. "application/vnd.ollama.image.adapter":
  45. blobpath, err := GetBlobsPath(layer.Digest)
  46. if err != nil {
  47. return nil, err
  48. }
  49. blob, err := os.Open(blobpath)
  50. if err != nil {
  51. return nil, err
  52. }
  53. defer blob.Close()
  54. ggml, _, err := llm.DecodeGGML(blob)
  55. if err != nil {
  56. return nil, err
  57. }
  58. layers = append(layers, &layerWithGGML{layer, ggml})
  59. default:
  60. layers = append(layers, &layerWithGGML{layer, nil})
  61. }
  62. }
  63. return layers, nil
  64. }
  65. func parseFromZipFile(_ context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerWithGGML, err error) {
  66. stat, err := file.Stat()
  67. if err != nil {
  68. return nil, err
  69. }
  70. r, err := zip.NewReader(file, stat.Size())
  71. if err != nil {
  72. return nil, err
  73. }
  74. tempdir, err := os.MkdirTemp(filepath.Dir(file.Name()), "")
  75. if err != nil {
  76. return nil, err
  77. }
  78. defer os.RemoveAll(tempdir)
  79. fn(api.ProgressResponse{Status: "unpacking model metadata"})
  80. for _, f := range r.File {
  81. // TODO(mxyng): this should not write out all files to disk
  82. outfile, err := os.Create(filepath.Join(tempdir, f.Name))
  83. if err != nil {
  84. return nil, err
  85. }
  86. defer outfile.Close()
  87. infile, err := f.Open()
  88. if err != nil {
  89. return nil, err
  90. }
  91. defer infile.Close()
  92. if _, err = io.Copy(outfile, infile); err != nil {
  93. return nil, err
  94. }
  95. if err := outfile.Close(); err != nil {
  96. return nil, err
  97. }
  98. if err := infile.Close(); err != nil {
  99. return nil, err
  100. }
  101. }
  102. mf, err := convert.GetModelFormat(tempdir)
  103. if err != nil {
  104. return nil, err
  105. }
  106. params, err := mf.GetParams(tempdir)
  107. if err != nil {
  108. return nil, err
  109. }
  110. mArch, err := mf.GetModelArch("", tempdir, params)
  111. if err != nil {
  112. return nil, err
  113. }
  114. fn(api.ProgressResponse{Status: "processing tensors"})
  115. if err := mArch.GetTensors(); err != nil {
  116. return nil, err
  117. }
  118. if err := mArch.LoadVocab(); err != nil {
  119. return nil, err
  120. }
  121. fn(api.ProgressResponse{Status: "converting model"})
  122. // TODO(mxyng): this should write directly into a layer
  123. // e.g. NewLayer(arch.Reader(), "application/vnd.ollama.image.model")
  124. temp, err := os.CreateTemp(tempdir, "fp16")
  125. if err != nil {
  126. return nil, err
  127. }
  128. defer temp.Close()
  129. defer os.Remove(temp.Name())
  130. if err = mArch.WriteGGUF(temp); err != nil {
  131. return nil, err
  132. }
  133. if _, err := temp.Seek(0, io.SeekStart); err != nil {
  134. return nil, err
  135. }
  136. layer, err := NewLayer(temp, "application/vnd.ollama.image.model")
  137. if err != nil {
  138. return nil, err
  139. }
  140. bin, err := layer.Open()
  141. if err != nil {
  142. return nil, err
  143. }
  144. defer bin.Close()
  145. ggml, _, err := llm.DecodeGGML(bin)
  146. if err != nil {
  147. return nil, err
  148. }
  149. layers = append(layers, &layerWithGGML{layer, ggml})
  150. intermediateBlobs[digest] = layer.Digest
  151. return layers, nil
  152. }
  153. func parseFromFile(ctx context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerWithGGML, err error) {
  154. sr := io.NewSectionReader(file, 0, 512)
  155. contentType, err := detectContentType(sr)
  156. if err != nil {
  157. return nil, err
  158. }
  159. switch contentType {
  160. case "gguf", "ggla":
  161. // noop
  162. case "application/zip":
  163. return parseFromZipFile(ctx, file, digest, fn)
  164. default:
  165. return nil, fmt.Errorf("unsupported content type: %s", contentType)
  166. }
  167. stat, err := file.Stat()
  168. if err != nil {
  169. return nil, err
  170. }
  171. var offset int64
  172. for offset < stat.Size() {
  173. ggml, n, err := llm.DecodeGGML(file)
  174. if errors.Is(err, io.EOF) {
  175. break
  176. } else if err != nil {
  177. return nil, err
  178. }
  179. mediatype := "application/vnd.ollama.image.model"
  180. if ggml.Name() == "ggla" {
  181. mediatype = "application/vnd.ollama.image.adapter"
  182. } else if ggml.KV().Architecture() == "clip" {
  183. mediatype = "application/vnd.ollama.image.projector"
  184. }
  185. layer, err := NewLayer(io.NewSectionReader(file, offset, n), mediatype)
  186. if err != nil {
  187. return nil, err
  188. }
  189. layers = append(layers, &layerWithGGML{layer, ggml})
  190. offset = n
  191. }
  192. return layers, nil
  193. }
  194. func detectContentType(r io.Reader) (string, error) {
  195. var b bytes.Buffer
  196. if _, err := io.Copy(&b, r); err != nil {
  197. return "", err
  198. }
  199. if contentType := llm.DetectGGMLType(b.Bytes()); contentType != "" {
  200. return contentType, nil
  201. }
  202. if contentType := http.DetectContentType(b.Bytes()); contentType != "application/octet-stream" {
  203. return contentType, nil
  204. }
  205. return "unknown", nil
  206. }