model.go 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421
  1. package server
  2. import (
  3. "archive/zip"
  4. "bytes"
  5. "context"
  6. "encoding/json"
  7. "errors"
  8. "fmt"
  9. "io"
  10. "log/slog"
  11. "net/http"
  12. "os"
  13. "path/filepath"
  14. "slices"
  15. "strings"
  16. "text/template/parse"
  17. "github.com/Masterminds/semver/v3"
  18. "github.com/ollama/ollama/api"
  19. "github.com/ollama/ollama/convert"
  20. "github.com/ollama/ollama/llm"
  21. "github.com/ollama/ollama/template"
  22. "github.com/ollama/ollama/types/model"
  23. )
  24. var intermediateBlobs map[string]string = make(map[string]string)
  25. type layerGGML struct {
  26. *Layer
  27. *llm.GGML
  28. }
  29. func parseFromModel(ctx context.Context, name model.Name, fn func(api.ProgressResponse)) (layers []*layerGGML, version *semver.Version, err error) {
  30. m, err := ParseNamedManifest(name)
  31. switch {
  32. case errors.Is(err, os.ErrNotExist):
  33. if err := PullModel(ctx, name.String(), &registryOptions{}, fn); err != nil {
  34. return nil, version, err
  35. }
  36. m, err = ParseNamedManifest(name)
  37. if err != nil {
  38. return nil, version, err
  39. }
  40. case err != nil:
  41. return nil, version, err
  42. }
  43. version = m.Ollama
  44. for _, layer := range m.Layers {
  45. layer, err := NewLayerFromLayer(layer.Digest, layer.MediaType, name.DisplayShortest())
  46. if err != nil {
  47. return nil, version, err
  48. }
  49. switch layer.MediaType {
  50. case "application/vnd.ollama.image.model",
  51. "application/vnd.ollama.image.projector",
  52. "application/vnd.ollama.image.adapter":
  53. blobpath, err := GetBlobsPath(layer.Digest)
  54. if err != nil {
  55. return nil, version, err
  56. }
  57. blob, err := os.Open(blobpath)
  58. if err != nil {
  59. return nil, version, err
  60. }
  61. defer blob.Close()
  62. ggml, _, err := llm.DecodeGGML(blob, 0)
  63. if err != nil {
  64. return nil, version, err
  65. }
  66. layers = append(layers, &layerGGML{layer, ggml})
  67. default:
  68. layers = append(layers, &layerGGML{layer, nil})
  69. }
  70. }
  71. return layers, version, nil
  72. }
  73. func extractFromZipFile(p string, file *os.File, fn func(api.ProgressResponse)) error {
  74. stat, err := file.Stat()
  75. if err != nil {
  76. return err
  77. }
  78. r, err := zip.NewReader(file, stat.Size())
  79. if err != nil {
  80. return err
  81. }
  82. fn(api.ProgressResponse{Status: "unpacking model metadata"})
  83. for _, f := range r.File {
  84. if !filepath.IsLocal(f.Name) {
  85. return fmt.Errorf("%w: %s", zip.ErrInsecurePath, f.Name)
  86. }
  87. n := filepath.Join(p, f.Name)
  88. if err := os.MkdirAll(filepath.Dir(n), 0o750); err != nil {
  89. return err
  90. }
  91. // TODO(mxyng): this should not write out all files to disk
  92. outfile, err := os.Create(n)
  93. if err != nil {
  94. return err
  95. }
  96. defer outfile.Close()
  97. infile, err := f.Open()
  98. if err != nil {
  99. return err
  100. }
  101. defer infile.Close()
  102. if _, err = io.Copy(outfile, infile); err != nil {
  103. return err
  104. }
  105. if err := outfile.Close(); err != nil {
  106. return err
  107. }
  108. if err := infile.Close(); err != nil {
  109. return err
  110. }
  111. }
  112. return nil
  113. }
  114. func parseFromZipFile(_ context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
  115. tempDir, err := os.MkdirTemp(filepath.Dir(file.Name()), "")
  116. if err != nil {
  117. return nil, err
  118. }
  119. defer os.RemoveAll(tempDir)
  120. if err := extractFromZipFile(tempDir, file, fn); err != nil {
  121. return nil, err
  122. }
  123. mf, err := convert.GetModelFormat(tempDir)
  124. if err != nil {
  125. return nil, err
  126. }
  127. params, err := mf.GetParams(tempDir)
  128. if err != nil {
  129. return nil, err
  130. }
  131. mArch, err := mf.GetModelArch("", tempDir, params)
  132. if err != nil {
  133. return nil, err
  134. }
  135. fn(api.ProgressResponse{Status: "processing tensors"})
  136. if err := mArch.GetTensors(); err != nil {
  137. return nil, err
  138. }
  139. if err := mArch.LoadVocab(); err != nil {
  140. return nil, err
  141. }
  142. fn(api.ProgressResponse{Status: "converting model"})
  143. // TODO(mxyng): this should write directly into a layer
  144. // e.g. NewLayer(arch.Reader(), "application/vnd.ollama.image.model")
  145. temp, err := os.CreateTemp(tempDir, "fp16")
  146. if err != nil {
  147. return nil, err
  148. }
  149. defer temp.Close()
  150. defer os.Remove(temp.Name())
  151. if err = mArch.WriteGGUF(temp); err != nil {
  152. return nil, err
  153. }
  154. if _, err := temp.Seek(0, io.SeekStart); err != nil {
  155. return nil, err
  156. }
  157. layer, err := NewLayer(temp, "application/vnd.ollama.image.model")
  158. if err != nil {
  159. return nil, err
  160. }
  161. bin, err := layer.Open()
  162. if err != nil {
  163. return nil, err
  164. }
  165. defer bin.Close()
  166. ggml, _, err := llm.DecodeGGML(bin, 0)
  167. if err != nil {
  168. return nil, err
  169. }
  170. layers = append(layers, &layerGGML{layer, ggml})
  171. intermediateBlobs[digest] = layer.Digest
  172. return detectChatTemplate(layers)
  173. }
  174. func parseFromFile(ctx context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
  175. sr := io.NewSectionReader(file, 0, 512)
  176. contentType, err := detectContentType(sr)
  177. if err != nil {
  178. return nil, err
  179. }
  180. switch contentType {
  181. case "gguf", "ggla":
  182. // noop
  183. case "application/zip":
  184. return parseFromZipFile(ctx, file, digest, fn)
  185. default:
  186. return nil, fmt.Errorf("unsupported content type: %s", contentType)
  187. }
  188. stat, err := file.Stat()
  189. if err != nil {
  190. return nil, err
  191. }
  192. var offset int64
  193. for offset < stat.Size() {
  194. ggml, n, err := llm.DecodeGGML(file, 0)
  195. if errors.Is(err, io.EOF) {
  196. break
  197. } else if err != nil {
  198. return nil, err
  199. }
  200. mediatype := "application/vnd.ollama.image.model"
  201. if ggml.Name() == "ggla" {
  202. mediatype = "application/vnd.ollama.image.adapter"
  203. } else if ggml.KV().Architecture() == "clip" {
  204. mediatype = "application/vnd.ollama.image.projector"
  205. }
  206. layer, err := NewLayer(io.NewSectionReader(file, offset, n), mediatype)
  207. if err != nil {
  208. return nil, err
  209. }
  210. layers = append(layers, &layerGGML{layer, ggml})
  211. offset = n
  212. }
  213. return detectChatTemplate(layers)
  214. }
  215. func detectChatTemplate(layers []*layerGGML) ([]*layerGGML, error) {
  216. for _, layer := range layers {
  217. if s := layer.GGML.KV().ChatTemplate(); s != "" {
  218. if t, err := template.Named(s); err != nil {
  219. slog.Debug("template detection", "error", err)
  220. } else {
  221. layer, err := NewLayer(t.Reader(), "application/vnd.ollama.image.template")
  222. if err != nil {
  223. return nil, err
  224. }
  225. layer.status = fmt.Sprintf("using autodetected template %s", t.Name)
  226. layers = append(layers, &layerGGML{layer, nil})
  227. if t.Parameters != nil {
  228. var b bytes.Buffer
  229. if err := json.NewEncoder(&b).Encode(t.Parameters); err != nil {
  230. return nil, err
  231. }
  232. layer, err := NewLayer(&b, "application/vnd.ollama.image.params")
  233. if err != nil {
  234. return nil, err
  235. }
  236. layers = append(layers, &layerGGML{layer, nil})
  237. }
  238. }
  239. }
  240. }
  241. return layers, nil
  242. }
  243. func detectContentType(r io.Reader) (string, error) {
  244. var b bytes.Buffer
  245. if _, err := io.Copy(&b, r); err != nil {
  246. return "", err
  247. }
  248. if contentType := llm.DetectGGMLType(b.Bytes()); contentType != "" {
  249. return contentType, nil
  250. }
  251. if contentType := http.DetectContentType(b.Bytes()); contentType != "application/octet-stream" {
  252. return contentType, nil
  253. }
  254. return "unknown", nil
  255. }
  256. // parseToolCalls attempts to parse a JSON string into a slice of ToolCalls.
  257. // mxyng: this only really works if the input contains tool calls in some JSON format
  258. func (m *Model) parseToolCalls(s string) ([]api.ToolCall, bool) {
  259. // create a subtree from the node that ranges over .ToolCalls
  260. tmpl := m.Template.Subtree(func(n parse.Node) bool {
  261. if t, ok := n.(*parse.RangeNode); ok {
  262. return slices.Contains(template.Identifiers(t.Pipe), "ToolCalls")
  263. }
  264. return false
  265. })
  266. if tmpl == nil {
  267. return nil, false
  268. }
  269. var b bytes.Buffer
  270. if err := tmpl.Execute(&b, map[string][]api.ToolCall{
  271. "ToolCalls": {
  272. {
  273. Function: api.ToolCallFunction{
  274. Name: "@@name@@",
  275. Arguments: api.ToolCallFunctionArguments{
  276. "@@argument@@": 1,
  277. },
  278. },
  279. },
  280. },
  281. }); err != nil {
  282. return nil, false
  283. }
  284. var kv map[string]any
  285. // execute the subtree with placeholders to identify the keys
  286. // trim any commands that might exist in the template
  287. if err := json.Unmarshal(bytes.TrimSuffix(b.Bytes(), []byte(",")), &kv); err != nil {
  288. return nil, false
  289. }
  290. // find the keys that correspond to the name and arguments fields
  291. var name, arguments string
  292. for k, v := range kv {
  293. switch v.(type) {
  294. case string:
  295. name = k
  296. case map[string]any:
  297. arguments = k
  298. }
  299. }
  300. if name == "" || arguments == "" {
  301. return nil, false
  302. }
  303. var objs []map[string]any
  304. for offset := 0; offset < len(s); {
  305. var obj map[string]any
  306. decoder := json.NewDecoder(strings.NewReader(s[offset:]))
  307. if err := decoder.Decode(&obj); errors.Is(err, io.EOF) || errors.Is(err, io.ErrUnexpectedEOF) {
  308. break
  309. } else if syntax := &(json.SyntaxError{}); errors.As(err, &syntax) {
  310. // skip over any syntax errors
  311. offset += int(syntax.Offset)
  312. } else if unmarshalType := &(json.UnmarshalTypeError{}); errors.As(err, &unmarshalType) {
  313. // skip over any unmarshalable types
  314. offset += int(unmarshalType.Offset)
  315. } else if err != nil {
  316. slog.Error("parseToolCalls", "error", err)
  317. return nil, false
  318. } else {
  319. offset += int(decoder.InputOffset())
  320. // collect all nested objects
  321. var collect func(any) []map[string]any
  322. collect = func(obj any) (all []map[string]any) {
  323. switch o := obj.(type) {
  324. case map[string]any:
  325. all = append(all, o)
  326. for _, v := range o {
  327. all = append(all, collect(v)...)
  328. }
  329. case []any:
  330. for _, v := range o {
  331. all = append(all, collect(v)...)
  332. }
  333. }
  334. return all
  335. }
  336. objs = append(objs, collect(obj)...)
  337. }
  338. }
  339. var toolCalls []api.ToolCall
  340. for _, kv := range objs {
  341. n, nok := kv[name].(string)
  342. a, aok := kv[arguments].(map[string]any)
  343. if nok && aok {
  344. toolCalls = append(toolCalls, api.ToolCall{
  345. Function: api.ToolCallFunction{
  346. Name: n,
  347. Arguments: a,
  348. },
  349. })
  350. }
  351. }
  352. return toolCalls, len(toolCalls) > 0
  353. }