model.go 8.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396
  1. package server
  2. import (
  3. "archive/zip"
  4. "bytes"
  5. "context"
  6. "encoding/json"
  7. "errors"
  8. "fmt"
  9. "io"
  10. "log/slog"
  11. "net/http"
  12. "os"
  13. "path/filepath"
  14. "slices"
  15. "strings"
  16. "text/template/parse"
  17. "github.com/google/uuid"
  18. "github.com/ollama/ollama/api"
  19. "github.com/ollama/ollama/convert"
  20. "github.com/ollama/ollama/llm"
  21. "github.com/ollama/ollama/template"
  22. "github.com/ollama/ollama/types/model"
  23. )
  // intermediateBlobs maps the digest handed to parseFromZipFile to the digest
  // of the model layer that was produced from that archive.
  var intermediateBlobs = map[string]string{}
  // layerGGML pairs a Layer with the GGML decoded from that layer's contents.
  // GGML is nil for layers that were not decoded (for example template layers
  // and manifest layers with other media types).
  type layerGGML struct {
  	// Layer is the stored layer.
  	*Layer
  	// GGML is the decoded model data for the layer, or nil.
  	*llm.GGML
  }
  29. func parseFromModel(ctx context.Context, name model.Name, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
  30. m, err := ParseNamedManifest(name)
  31. switch {
  32. case errors.Is(err, os.ErrNotExist):
  33. if err := PullModel(ctx, name.String(), &registryOptions{}, fn); err != nil {
  34. return nil, err
  35. }
  36. m, err = ParseNamedManifest(name)
  37. if err != nil {
  38. return nil, err
  39. }
  40. case err != nil:
  41. return nil, err
  42. }
  43. for _, layer := range m.Layers {
  44. layer, err := NewLayerFromLayer(layer.Digest, layer.MediaType, name.DisplayShortest())
  45. if err != nil {
  46. return nil, err
  47. }
  48. switch layer.MediaType {
  49. case "application/vnd.ollama.image.model",
  50. "application/vnd.ollama.image.projector",
  51. "application/vnd.ollama.image.adapter":
  52. blobpath, err := GetBlobsPath(layer.Digest)
  53. if err != nil {
  54. return nil, err
  55. }
  56. blob, err := os.Open(blobpath)
  57. if err != nil {
  58. return nil, err
  59. }
  60. defer blob.Close()
  61. ggml, _, err := llm.DecodeGGML(blob, 0)
  62. if err != nil {
  63. return nil, err
  64. }
  65. layers = append(layers, &layerGGML{layer, ggml})
  66. default:
  67. layers = append(layers, &layerGGML{layer, nil})
  68. }
  69. }
  70. return layers, nil
  71. }
  72. func extractFromZipFile(p string, file *os.File, fn func(api.ProgressResponse)) error {
  73. stat, err := file.Stat()
  74. if err != nil {
  75. return err
  76. }
  77. r, err := zip.NewReader(file, stat.Size())
  78. if err != nil {
  79. return err
  80. }
  81. fn(api.ProgressResponse{Status: "unpacking model metadata"})
  82. for _, f := range r.File {
  83. if !filepath.IsLocal(f.Name) {
  84. return fmt.Errorf("%w: %s", zip.ErrInsecurePath, f.Name)
  85. }
  86. n := filepath.Join(p, f.Name)
  87. if err := os.MkdirAll(filepath.Dir(n), 0o750); err != nil {
  88. return err
  89. }
  90. // TODO(mxyng): this should not write out all files to disk
  91. outfile, err := os.Create(n)
  92. if err != nil {
  93. return err
  94. }
  95. defer outfile.Close()
  96. infile, err := f.Open()
  97. if err != nil {
  98. return err
  99. }
  100. defer infile.Close()
  101. if _, err = io.Copy(outfile, infile); err != nil {
  102. return err
  103. }
  104. if err := outfile.Close(); err != nil {
  105. return err
  106. }
  107. if err := infile.Close(); err != nil {
  108. return err
  109. }
  110. }
  111. return nil
  112. }
  113. func parseFromZipFile(_ context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
  114. tempDir, err := os.MkdirTemp(filepath.Dir(file.Name()), "")
  115. if err != nil {
  116. return nil, err
  117. }
  118. defer os.RemoveAll(tempDir)
  119. if err := extractFromZipFile(tempDir, file, fn); err != nil {
  120. return nil, err
  121. }
  122. mf, err := convert.GetModelFormat(tempDir)
  123. if err != nil {
  124. return nil, err
  125. }
  126. params, err := mf.GetParams(tempDir)
  127. if err != nil {
  128. return nil, err
  129. }
  130. mArch, err := mf.GetModelArch("", tempDir, params)
  131. if err != nil {
  132. return nil, err
  133. }
  134. fn(api.ProgressResponse{Status: "processing tensors"})
  135. if err := mArch.GetTensors(); err != nil {
  136. return nil, err
  137. }
  138. if err := mArch.LoadVocab(); err != nil {
  139. return nil, err
  140. }
  141. fn(api.ProgressResponse{Status: "converting model"})
  142. // TODO(mxyng): this should write directly into a layer
  143. // e.g. NewLayer(arch.Reader(), "application/vnd.ollama.image.model")
  144. temp, err := os.CreateTemp(tempDir, "fp16")
  145. if err != nil {
  146. return nil, err
  147. }
  148. defer temp.Close()
  149. defer os.Remove(temp.Name())
  150. if err = mArch.WriteGGUF(temp); err != nil {
  151. return nil, err
  152. }
  153. if _, err := temp.Seek(0, io.SeekStart); err != nil {
  154. return nil, err
  155. }
  156. layer, err := NewLayer(temp, "application/vnd.ollama.image.model")
  157. if err != nil {
  158. return nil, err
  159. }
  160. bin, err := layer.Open()
  161. if err != nil {
  162. return nil, err
  163. }
  164. defer bin.Close()
  165. ggml, _, err := llm.DecodeGGML(bin, 0)
  166. if err != nil {
  167. return nil, err
  168. }
  169. layers = append(layers, &layerGGML{layer, ggml})
  170. intermediateBlobs[digest] = layer.Digest
  171. return detectChatTemplate(layers)
  172. }
  173. func parseFromFile(ctx context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
  174. sr := io.NewSectionReader(file, 0, 512)
  175. contentType, err := detectContentType(sr)
  176. if err != nil {
  177. return nil, err
  178. }
  179. switch contentType {
  180. case "gguf", "ggla":
  181. // noop
  182. case "application/zip":
  183. return parseFromZipFile(ctx, file, digest, fn)
  184. default:
  185. return nil, fmt.Errorf("unsupported content type: %s", contentType)
  186. }
  187. stat, err := file.Stat()
  188. if err != nil {
  189. return nil, err
  190. }
  191. var offset int64
  192. for offset < stat.Size() {
  193. ggml, n, err := llm.DecodeGGML(file, 0)
  194. if errors.Is(err, io.EOF) {
  195. break
  196. } else if err != nil {
  197. return nil, err
  198. }
  199. mediatype := "application/vnd.ollama.image.model"
  200. if ggml.Name() == "ggla" {
  201. mediatype = "application/vnd.ollama.image.adapter"
  202. } else if ggml.KV().Architecture() == "clip" {
  203. mediatype = "application/vnd.ollama.image.projector"
  204. }
  205. layer, err := NewLayer(io.NewSectionReader(file, offset, n), mediatype)
  206. if err != nil {
  207. return nil, err
  208. }
  209. layers = append(layers, &layerGGML{layer, ggml})
  210. offset = n
  211. }
  212. return detectChatTemplate(layers)
  213. }
  214. func detectChatTemplate(layers []*layerGGML) ([]*layerGGML, error) {
  215. for _, layer := range layers {
  216. if s := layer.GGML.KV().ChatTemplate(); s != "" {
  217. if t, err := template.Named(s); err != nil {
  218. slog.Debug("template detection", "error", err)
  219. } else {
  220. tmpl, err := NewLayer(t.Reader(), "application/vnd.ollama.image.template")
  221. if err != nil {
  222. return nil, err
  223. }
  224. tmpl.status = fmt.Sprintf("using autodetected template %s", t.Name)
  225. layers = append(layers, &layerGGML{tmpl, nil})
  226. }
  227. }
  228. }
  229. return layers, nil
  230. }
  231. func detectContentType(r io.Reader) (string, error) {
  232. var b bytes.Buffer
  233. if _, err := io.Copy(&b, r); err != nil {
  234. return "", err
  235. }
  236. if contentType := llm.DetectGGMLType(b.Bytes()); contentType != "" {
  237. return contentType, nil
  238. }
  239. if contentType := http.DetectContentType(b.Bytes()); contentType != "application/octet-stream" {
  240. return contentType, nil
  241. }
  242. return "unknown", nil
  243. }
  244. // parseToolCalls attempts to parse a JSON string into a slice of ToolCalls.
  245. // mxyng: this only really works if the input contains tool calls in some JSON format
  246. func (m *Model) parseToolCalls(s string) ([]api.ToolCall, bool) {
  247. // create a subtree from the node that ranges over .ToolCalls
  248. tmpl := m.Template.Subtree(func(n parse.Node) bool {
  249. if t, ok := n.(*parse.RangeNode); ok {
  250. return slices.Contains(template.Identifiers(t.Pipe), "ToolCalls")
  251. }
  252. return false
  253. })
  254. if tmpl == nil {
  255. return nil, false
  256. }
  257. var b bytes.Buffer
  258. if err := tmpl.Execute(&b, map[string][]map[string]any{
  259. "ToolCalls": {
  260. {
  261. "Function": map[string]any{
  262. "Name": "@@name@@",
  263. "Arguments": "@@arguments@@",
  264. },
  265. },
  266. },
  267. }); err != nil {
  268. return nil, false
  269. }
  270. var kv map[string]string
  271. // execute the subtree with placeholders to identify the keys
  272. if err := json.Unmarshal(b.Bytes(), &kv); err != nil {
  273. return nil, false
  274. }
  275. // find the keys that correspond to the name and arguments fields
  276. var name, arguments string
  277. for k, v := range kv {
  278. switch v {
  279. case "@@name@@":
  280. name = k
  281. case "@@arguments@@":
  282. arguments = k
  283. }
  284. }
  285. var sm []map[string]any
  286. decoder := json.NewDecoder(strings.NewReader(s))
  287. for {
  288. // incrementally decode the JSON into a list of JSON objects
  289. // skipping over any invalid tokens
  290. if err := decoder.Decode(&sm); err != nil {
  291. if errors.Is(err, io.EOF) {
  292. break
  293. }
  294. if errors.As(err, new(*json.SyntaxError)) {
  295. r := decoder.Buffered()
  296. if _, err := r.Read(make([]byte, decoder.InputOffset()+1)); err != nil {
  297. break
  298. }
  299. decoder = json.NewDecoder(r)
  300. continue
  301. }
  302. return nil, false
  303. }
  304. // break as soon as a valid object is decoded
  305. break
  306. }
  307. var toolCalls []api.ToolCall
  308. for _, kv := range sm {
  309. call := api.ToolCall{
  310. ID: uuid.New().String(),
  311. Type: "function",
  312. }
  313. for k, v := range kv {
  314. switch k {
  315. case name:
  316. call.Function.Name = v.(string)
  317. case arguments:
  318. call.Function.Arguments = v.(map[string]any)
  319. }
  320. }
  321. toolCalls = append(toolCalls, call)
  322. }
  323. if len(toolCalls) > 0 {
  324. return toolCalls, true
  325. }
  326. return nil, false
  327. }