model.go 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387
  1. package server
  2. import (
  3. "archive/zip"
  4. "bytes"
  5. "context"
  6. "encoding/json"
  7. "errors"
  8. "fmt"
  9. "io"
  10. "log/slog"
  11. "net/http"
  12. "os"
  13. "path/filepath"
  14. "slices"
  15. "strings"
  16. "text/template/parse"
  17. "github.com/ollama/ollama/api"
  18. "github.com/ollama/ollama/convert"
  19. "github.com/ollama/ollama/llm"
  20. "github.com/ollama/ollama/template"
  21. "github.com/ollama/ollama/types/model"
  22. )
  // intermediateBlobs is keyed by the digest handed to parseFromZipFile and
  // holds the digest of the layer that the conversion produced for it.
  var intermediateBlobs = make(map[string]string)
  24. type layerGGML struct {
  25. Layer
  26. *llm.GGML
  27. }
  28. func parseFromModel(ctx context.Context, name model.Name, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
  29. m, err := ParseNamedManifest(name)
  30. switch {
  31. case errors.Is(err, os.ErrNotExist):
  32. if err := PullModel(ctx, name.String(), &registryOptions{}, fn); err != nil {
  33. return nil, err
  34. }
  35. m, err = ParseNamedManifest(name)
  36. if err != nil {
  37. return nil, err
  38. }
  39. case err != nil:
  40. return nil, err
  41. }
  42. for _, layer := range m.Layers {
  43. layer, err := NewLayerFromLayer(layer.Digest, layer.MediaType, name.DisplayShortest())
  44. if err != nil {
  45. return nil, err
  46. }
  47. switch layer.MediaType {
  48. case "application/vnd.ollama.image.model",
  49. "application/vnd.ollama.image.projector",
  50. "application/vnd.ollama.image.adapter":
  51. blobpath, err := GetBlobsPath(layer.Digest)
  52. if err != nil {
  53. return nil, err
  54. }
  55. blob, err := os.Open(blobpath)
  56. if err != nil {
  57. return nil, err
  58. }
  59. defer blob.Close()
  60. ggml, _, err := llm.DecodeGGML(blob, 0)
  61. if err != nil {
  62. return nil, err
  63. }
  64. layers = append(layers, &layerGGML{layer, ggml})
  65. default:
  66. layers = append(layers, &layerGGML{layer, nil})
  67. }
  68. }
  69. return layers, nil
  70. }
  71. func parseFromZipFile(_ context.Context, command string, baseLayers []*layerGGML, f *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
  72. fi, err := f.Stat()
  73. if err != nil {
  74. return nil, err
  75. }
  76. r, err := zip.NewReader(f, fi.Size())
  77. if err != nil {
  78. return nil, err
  79. }
  80. p, err := os.MkdirTemp(filepath.Dir(f.Name()), "")
  81. if err != nil {
  82. return nil, err
  83. }
  84. defer os.RemoveAll(p)
  85. // TODO(mxyng): this should write directly into a layer
  86. // e.g. NewLayer(arch.Reader(), "application/vnd.ollama.image.model")
  87. t, err := os.CreateTemp(p, "fp16")
  88. if err != nil {
  89. return nil, err
  90. }
  91. defer t.Close()
  92. defer os.Remove(t.Name())
  93. var layerType string
  94. switch command {
  95. case "adapter":
  96. var baseModel *llm.GGML
  97. for _, l := range baseLayers {
  98. if l.GGML != nil {
  99. baseModel = l.GGML
  100. break
  101. }
  102. }
  103. if baseModel == nil {
  104. return nil, fmt.Errorf("no base model specified for the adapter")
  105. }
  106. fn(api.ProgressResponse{
  107. Status: "converting adapter",
  108. })
  109. if err := convert.ConvertAdapter(convert.NewZipReader(r, p, 32<<20), t, baseModel.KV(), fn); err != nil {
  110. return nil, err
  111. }
  112. layerType = "application/vnd.ollama.image.adapter"
  113. case "model":
  114. fn(api.ProgressResponse{
  115. Status: "converting model",
  116. })
  117. if err := convert.ConvertModel(convert.NewZipReader(r, p, 32<<20), t, fn); err != nil {
  118. return nil, err
  119. }
  120. layerType = "application/vnd.ollama.image.model"
  121. }
  122. if _, err := t.Seek(0, io.SeekStart); err != nil {
  123. return nil, err
  124. }
  125. layer, err := NewLayer(t, layerType)
  126. if err != nil {
  127. return nil, err
  128. }
  129. bin, err := layer.Open()
  130. if err != nil {
  131. return nil, err
  132. }
  133. defer bin.Close()
  134. ggml, _, err := llm.DecodeGGML(bin, 0)
  135. if err != nil {
  136. return nil, err
  137. }
  138. layers = append(layers, &layerGGML{layer, ggml})
  139. intermediateBlobs[digest] = layer.Digest
  140. return detectChatTemplate(layers)
  141. }
  142. func parseFromFile(ctx context.Context, command string, baseLayers []*layerGGML, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
  143. sr := io.NewSectionReader(file, 0, 512)
  144. contentType, err := detectContentType(sr)
  145. if err != nil {
  146. return nil, err
  147. }
  148. switch contentType {
  149. case "gguf", "ggla":
  150. // noop
  151. case "application/zip":
  152. return parseFromZipFile(ctx, command, baseLayers, file, digest, fn)
  153. default:
  154. return nil, fmt.Errorf("unsupported content type: %s", contentType)
  155. }
  156. stat, err := file.Stat()
  157. if err != nil {
  158. return nil, err
  159. }
  160. var offset int64
  161. for offset < stat.Size() {
  162. ggml, n, err := llm.DecodeGGML(file, 0)
  163. if errors.Is(err, io.EOF) {
  164. break
  165. } else if err != nil {
  166. return nil, err
  167. }
  168. mediatype := "application/vnd.ollama.image.model"
  169. if ggml.Name() == "ggla" || ggml.KV().Kind() == "adapter" {
  170. mediatype = "application/vnd.ollama.image.adapter"
  171. } else if ggml.KV().Architecture() == "clip" {
  172. mediatype = "application/vnd.ollama.image.projector"
  173. }
  174. var layer Layer
  175. if digest != "" && n == stat.Size() && offset == 0 {
  176. layer, err = NewLayerFromLayer(digest, mediatype, file.Name())
  177. if err != nil {
  178. slog.Debug("could not create new layer from layer", "error", err)
  179. }
  180. }
  181. // Fallback to creating layer from file copy (either NewLayerFromLayer failed, or digest empty/n != stat.Size())
  182. if layer.Digest == "" {
  183. layer, err = NewLayer(io.NewSectionReader(file, offset, n), mediatype)
  184. if err != nil {
  185. return nil, err
  186. }
  187. }
  188. layers = append(layers, &layerGGML{layer, ggml})
  189. offset = n
  190. }
  191. return detectChatTemplate(layers)
  192. }
  193. func detectChatTemplate(layers []*layerGGML) ([]*layerGGML, error) {
  194. for _, layer := range layers {
  195. if s := layer.GGML.KV().ChatTemplate(); s != "" {
  196. if t, err := template.Named(s); err != nil {
  197. slog.Debug("template detection", "error", err)
  198. } else {
  199. layer, err := NewLayer(t.Reader(), "application/vnd.ollama.image.template")
  200. if err != nil {
  201. return nil, err
  202. }
  203. layer.status = fmt.Sprintf("using autodetected template %s", t.Name)
  204. layers = append(layers, &layerGGML{layer, nil})
  205. if t.Parameters != nil {
  206. var b bytes.Buffer
  207. if err := json.NewEncoder(&b).Encode(t.Parameters); err != nil {
  208. return nil, err
  209. }
  210. layer, err := NewLayer(&b, "application/vnd.ollama.image.params")
  211. if err != nil {
  212. return nil, err
  213. }
  214. layers = append(layers, &layerGGML{layer, nil})
  215. }
  216. }
  217. }
  218. }
  219. return layers, nil
  220. }
  221. func detectContentType(r io.Reader) (string, error) {
  222. var b bytes.Buffer
  223. if _, err := io.Copy(&b, r); err != nil {
  224. return "", err
  225. }
  226. if contentType := llm.DetectGGMLType(b.Bytes()); contentType != "" {
  227. return contentType, nil
  228. }
  229. if contentType := http.DetectContentType(b.Bytes()); contentType != "application/octet-stream" {
  230. return contentType, nil
  231. }
  232. return "unknown", nil
  233. }
  234. // parseToolCalls attempts to parse a JSON string into a slice of ToolCalls.
  235. // mxyng: this only really works if the input contains tool calls in some JSON format
  236. func (m *Model) parseToolCalls(s string) ([]api.ToolCall, bool) {
  237. // create a subtree from the node that ranges over .ToolCalls
  238. tmpl := m.Template.Subtree(func(n parse.Node) bool {
  239. if t, ok := n.(*parse.RangeNode); ok {
  240. return slices.Contains(template.Identifiers(t.Pipe), "ToolCalls")
  241. }
  242. return false
  243. })
  244. if tmpl == nil {
  245. return nil, false
  246. }
  247. var b bytes.Buffer
  248. if err := tmpl.Execute(&b, map[string][]api.ToolCall{
  249. "ToolCalls": {
  250. {
  251. Function: api.ToolCallFunction{
  252. Name: "@@name@@",
  253. Arguments: api.ToolCallFunctionArguments{
  254. "@@argument@@": 1,
  255. },
  256. },
  257. },
  258. },
  259. }); err != nil {
  260. return nil, false
  261. }
  262. var kv map[string]any
  263. // execute the subtree with placeholders to identify the keys
  264. // trim any commands that might exist in the template
  265. if err := json.Unmarshal(bytes.TrimSuffix(b.Bytes(), []byte(",")), &kv); err != nil {
  266. return nil, false
  267. }
  268. // find the keys that correspond to the name and arguments fields
  269. var name, arguments string
  270. for k, v := range kv {
  271. switch v.(type) {
  272. case string:
  273. name = k
  274. case map[string]any:
  275. arguments = k
  276. }
  277. }
  278. if name == "" || arguments == "" {
  279. return nil, false
  280. }
  281. var objs []map[string]any
  282. for offset := 0; offset < len(s); {
  283. var obj map[string]any
  284. decoder := json.NewDecoder(strings.NewReader(s[offset:]))
  285. if err := decoder.Decode(&obj); errors.Is(err, io.EOF) || errors.Is(err, io.ErrUnexpectedEOF) {
  286. break
  287. } else if syntax := &(json.SyntaxError{}); errors.As(err, &syntax) {
  288. // skip over any syntax errors
  289. offset += int(syntax.Offset)
  290. } else if unmarshalType := &(json.UnmarshalTypeError{}); errors.As(err, &unmarshalType) {
  291. // skip over any unmarshalable types
  292. offset += int(unmarshalType.Offset)
  293. } else if err != nil {
  294. slog.Error("parseToolCalls", "error", err)
  295. return nil, false
  296. } else {
  297. offset += int(decoder.InputOffset())
  298. // collect all nested objects
  299. var collect func(any) []map[string]any
  300. collect = func(obj any) (all []map[string]any) {
  301. switch o := obj.(type) {
  302. case map[string]any:
  303. all = append(all, o)
  304. for _, v := range o {
  305. all = append(all, collect(v)...)
  306. }
  307. case []any:
  308. for _, v := range o {
  309. all = append(all, collect(v)...)
  310. }
  311. }
  312. return all
  313. }
  314. objs = append(objs, collect(obj)...)
  315. }
  316. }
  317. var toolCalls []api.ToolCall
  318. for _, kv := range objs {
  319. n, nok := kv[name].(string)
  320. a, aok := kv[arguments].(map[string]any)
  321. if nok && aok {
  322. toolCalls = append(toolCalls, api.ToolCall{
  323. Function: api.ToolCallFunction{
  324. Name: n,
  325. Arguments: a,
  326. },
  327. })
  328. }
  329. }
  330. return toolCalls, len(toolCalls) > 0
  331. }