cmd.go 34 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464
  1. package cmd
  2. import (
  3. "archive/zip"
  4. "bufio"
  5. "bytes"
  6. "context"
  7. "crypto/ed25519"
  8. "crypto/rand"
  9. "crypto/sha256"
  10. "encoding/pem"
  11. "errors"
  12. "fmt"
  13. "io"
  14. "log"
  15. "math"
  16. "net"
  17. "net/http"
  18. "os"
  19. "os/signal"
  20. "path/filepath"
  21. "regexp"
  22. "runtime"
  23. "slices"
  24. "strconv"
  25. "strings"
  26. "sync/atomic"
  27. "syscall"
  28. "time"
  29. "github.com/containerd/console"
  30. "github.com/mattn/go-runewidth"
  31. "github.com/olekukonko/tablewriter"
  32. "github.com/spf13/cobra"
  33. "golang.org/x/crypto/ssh"
  34. "golang.org/x/term"
  35. "github.com/ollama/ollama/api"
  36. "github.com/ollama/ollama/auth"
  37. "github.com/ollama/ollama/envconfig"
  38. "github.com/ollama/ollama/format"
  39. "github.com/ollama/ollama/parser"
  40. "github.com/ollama/ollama/progress"
  41. "github.com/ollama/ollama/server"
  42. "github.com/ollama/ollama/types/errtypes"
  43. "github.com/ollama/ollama/types/model"
  44. "github.com/ollama/ollama/version"
  45. )
  46. func CreateHandler(cmd *cobra.Command, args []string) error {
  47. filename, _ := cmd.Flags().GetString("file")
  48. filename, err := filepath.Abs(filename)
  49. if err != nil {
  50. return err
  51. }
  52. client, err := api.ClientFromEnvironment()
  53. if err != nil {
  54. return err
  55. }
  56. p := progress.NewProgress(os.Stderr)
  57. defer p.Stop()
  58. f, err := os.Open(filename)
  59. if err != nil {
  60. return err
  61. }
  62. defer f.Close()
  63. modelfile, err := parser.ParseFile(f)
  64. if err != nil {
  65. return err
  66. }
  67. home, err := os.UserHomeDir()
  68. if err != nil {
  69. return err
  70. }
  71. status := "transferring model data"
  72. spinner := progress.NewSpinner(status)
  73. p.Add(status, spinner)
  74. defer p.Stop()
  75. for i := range modelfile.Commands {
  76. switch modelfile.Commands[i].Name {
  77. case "model", "adapter":
  78. path := modelfile.Commands[i].Args
  79. if path == "~" {
  80. path = home
  81. } else if strings.HasPrefix(path, "~/") {
  82. path = filepath.Join(home, path[2:])
  83. }
  84. if !filepath.IsAbs(path) {
  85. path = filepath.Join(filepath.Dir(filename), path)
  86. }
  87. fi, err := os.Stat(path)
  88. if errors.Is(err, os.ErrNotExist) && modelfile.Commands[i].Name == "model" {
  89. continue
  90. } else if err != nil {
  91. return err
  92. }
  93. if fi.IsDir() {
  94. // this is likely a safetensors or pytorch directory
  95. // TODO make this work w/ adapters
  96. tempfile, err := tempZipFiles(path)
  97. if err != nil {
  98. return err
  99. }
  100. defer os.RemoveAll(tempfile)
  101. path = tempfile
  102. }
  103. digest, err := createBlob(cmd, client, path, spinner)
  104. if err != nil {
  105. return err
  106. }
  107. modelfile.Commands[i].Args = "@" + digest
  108. }
  109. }
  110. bars := make(map[string]*progress.Bar)
  111. fn := func(resp api.ProgressResponse) error {
  112. if resp.Digest != "" {
  113. spinner.Stop()
  114. bar, ok := bars[resp.Digest]
  115. if !ok {
  116. bar = progress.NewBar(fmt.Sprintf("pulling %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  117. bars[resp.Digest] = bar
  118. p.Add(resp.Digest, bar)
  119. }
  120. bar.Set(resp.Completed)
  121. } else if status != resp.Status {
  122. spinner.Stop()
  123. status = resp.Status
  124. spinner = progress.NewSpinner(status)
  125. p.Add(status, spinner)
  126. }
  127. return nil
  128. }
  129. quantize, _ := cmd.Flags().GetString("quantize")
  130. request := api.CreateRequest{Name: args[0], Modelfile: modelfile.String(), Quantize: quantize}
  131. if err := client.Create(cmd.Context(), &request, fn); err != nil {
  132. return err
  133. }
  134. return nil
  135. }
  136. func tempZipFiles(path string) (string, error) {
  137. tempfile, err := os.CreateTemp("", "ollama-tf")
  138. if err != nil {
  139. return "", err
  140. }
  141. defer tempfile.Close()
  142. detectContentType := func(path string) (string, error) {
  143. f, err := os.Open(path)
  144. if err != nil {
  145. return "", err
  146. }
  147. defer f.Close()
  148. var b bytes.Buffer
  149. b.Grow(512)
  150. if _, err := io.CopyN(&b, f, 512); err != nil && !errors.Is(err, io.EOF) {
  151. return "", err
  152. }
  153. contentType, _, _ := strings.Cut(http.DetectContentType(b.Bytes()), ";")
  154. return contentType, nil
  155. }
  156. glob := func(pattern, contentType string) ([]string, error) {
  157. matches, err := filepath.Glob(pattern)
  158. if err != nil {
  159. return nil, err
  160. }
  161. for _, safetensor := range matches {
  162. if ct, err := detectContentType(safetensor); err != nil {
  163. return nil, err
  164. } else if ct != contentType {
  165. return nil, fmt.Errorf("invalid content type: expected %s for %s", ct, safetensor)
  166. }
  167. }
  168. return matches, nil
  169. }
  170. var files []string
  171. if st, _ := glob(filepath.Join(path, "model*.safetensors"), "application/octet-stream"); len(st) > 0 {
  172. // safetensors files might be unresolved git lfs references; skip if they are
  173. // covers model-x-of-y.safetensors, model.fp32-x-of-y.safetensors, model.safetensors
  174. files = append(files, st...)
  175. } else if st, _ := glob(filepath.Join(path, "adapters.safetensors"), "application/octet-stream"); len(st) > 0 {
  176. // covers adapters.safetensors
  177. files = append(files, st...)
  178. } else if st, _ := glob(filepath.Join(path, "adapter_model.safetensors"), "application/octet-stream"); len(st) > 0 {
  179. // covers adapter_model.safetensors
  180. files = append(files, st...)
  181. } else if pt, _ := glob(filepath.Join(path, "pytorch_model*.bin"), "application/zip"); len(pt) > 0 {
  182. // pytorch files might also be unresolved git lfs references; skip if they are
  183. // covers pytorch_model-x-of-y.bin, pytorch_model.fp32-x-of-y.bin, pytorch_model.bin
  184. files = append(files, pt...)
  185. } else if pt, _ := glob(filepath.Join(path, "consolidated*.pth"), "application/zip"); len(pt) > 0 {
  186. // pytorch files might also be unresolved git lfs references; skip if they are
  187. // covers consolidated.x.pth, consolidated.pth
  188. files = append(files, pt...)
  189. } else {
  190. return "", errors.New("no safetensors or torch files found")
  191. }
  192. // add configuration files, json files are detected as text/plain
  193. js, err := glob(filepath.Join(path, "*.json"), "text/plain")
  194. if err != nil {
  195. return "", err
  196. }
  197. files = append(files, js...)
  198. // bert models require a nested config.json
  199. // TODO(mxyng): merge this with the glob above
  200. js, err = glob(filepath.Join(path, "**/*.json"), "text/plain")
  201. if err != nil {
  202. return "", err
  203. }
  204. files = append(files, js...)
  205. if tks, _ := glob(filepath.Join(path, "tokenizer.model"), "application/octet-stream"); len(tks) > 0 {
  206. // add tokenizer.model if it exists, tokenizer.json is automatically picked up by the previous glob
  207. // tokenizer.model might be a unresolved git lfs reference; error if it is
  208. files = append(files, tks...)
  209. } else if tks, _ := glob(filepath.Join(path, "**/tokenizer.model"), "text/plain"); len(tks) > 0 {
  210. // some times tokenizer.model is in a subdirectory (e.g. meta-llama/Meta-Llama-3-8B)
  211. files = append(files, tks...)
  212. }
  213. zipfile := zip.NewWriter(tempfile)
  214. defer zipfile.Close()
  215. for _, file := range files {
  216. f, err := os.Open(file)
  217. if err != nil {
  218. return "", err
  219. }
  220. defer f.Close()
  221. fi, err := f.Stat()
  222. if err != nil {
  223. return "", err
  224. }
  225. zfi, err := zip.FileInfoHeader(fi)
  226. if err != nil {
  227. return "", err
  228. }
  229. zfi.Name, err = filepath.Rel(path, file)
  230. if err != nil {
  231. return "", err
  232. }
  233. zf, err := zipfile.CreateHeader(zfi)
  234. if err != nil {
  235. return "", err
  236. }
  237. if _, err := io.Copy(zf, f); err != nil {
  238. return "", err
  239. }
  240. }
  241. return tempfile.Name(), nil
  242. }
  243. func createBlob(cmd *cobra.Command, client *api.Client, path string, spinner *progress.Spinner) (string, error) {
  244. bin, err := os.Open(path)
  245. if err != nil {
  246. return "", err
  247. }
  248. defer bin.Close()
  249. // Get file info to retrieve the size
  250. fileInfo, err := bin.Stat()
  251. if err != nil {
  252. return "", err
  253. }
  254. fileSize := fileInfo.Size()
  255. hash := sha256.New()
  256. if _, err := io.Copy(hash, bin); err != nil {
  257. return "", err
  258. }
  259. if _, err := bin.Seek(0, io.SeekStart); err != nil {
  260. return "", err
  261. }
  262. var pw progressWriter
  263. status := "transferring model data 0%"
  264. spinner.SetMessage(status)
  265. done := make(chan struct{})
  266. defer close(done)
  267. go func() {
  268. ticker := time.NewTicker(60 * time.Millisecond)
  269. defer ticker.Stop()
  270. for {
  271. select {
  272. case <-ticker.C:
  273. spinner.SetMessage(fmt.Sprintf("transferring model data %d%%", int(100*pw.n.Load()/fileSize)))
  274. case <-done:
  275. spinner.SetMessage("transferring model data 100%")
  276. return
  277. }
  278. }
  279. }()
  280. digest := fmt.Sprintf("sha256:%x", hash.Sum(nil))
  281. if err = client.CreateBlob(cmd.Context(), digest, io.TeeReader(bin, &pw)); err != nil {
  282. return "", err
  283. }
  284. return digest, nil
  285. }
  286. type progressWriter struct {
  287. n atomic.Int64
  288. }
  289. func (w *progressWriter) Write(p []byte) (n int, err error) {
  290. w.n.Add(int64(len(p)))
  291. return len(p), nil
  292. }
  293. func loadOrUnloadModel(cmd *cobra.Command, opts *runOptions) error {
  294. p := progress.NewProgress(os.Stderr)
  295. defer p.StopAndClear()
  296. spinner := progress.NewSpinner("")
  297. p.Add("", spinner)
  298. client, err := api.ClientFromEnvironment()
  299. if err != nil {
  300. return err
  301. }
  302. req := &api.GenerateRequest{
  303. Model: opts.Model,
  304. KeepAlive: opts.KeepAlive,
  305. }
  306. return client.Generate(cmd.Context(), req, func(api.GenerateResponse) error { return nil })
  307. }
  308. func StopHandler(cmd *cobra.Command, args []string) error {
  309. opts := &runOptions{
  310. Model: args[0],
  311. KeepAlive: &api.Duration{Duration: 0},
  312. }
  313. if err := loadOrUnloadModel(cmd, opts); err != nil {
  314. if strings.Contains(err.Error(), "not found") {
  315. return fmt.Errorf("couldn't find model \"%s\" to stop", args[0])
  316. }
  317. }
  318. return nil
  319. }
  320. func RunHandler(cmd *cobra.Command, args []string) error {
  321. interactive := true
  322. opts := runOptions{
  323. Model: args[0],
  324. WordWrap: os.Getenv("TERM") == "xterm-256color",
  325. Options: map[string]interface{}{},
  326. }
  327. format, err := cmd.Flags().GetString("format")
  328. if err != nil {
  329. return err
  330. }
  331. opts.Format = format
  332. keepAlive, err := cmd.Flags().GetString("keepalive")
  333. if err != nil {
  334. return err
  335. }
  336. if keepAlive != "" {
  337. d, err := time.ParseDuration(keepAlive)
  338. if err != nil {
  339. return err
  340. }
  341. opts.KeepAlive = &api.Duration{Duration: d}
  342. }
  343. prompts := args[1:]
  344. // prepend stdin to the prompt if provided
  345. if !term.IsTerminal(int(os.Stdin.Fd())) {
  346. in, err := io.ReadAll(os.Stdin)
  347. if err != nil {
  348. return err
  349. }
  350. prompts = append([]string{string(in)}, prompts...)
  351. opts.WordWrap = false
  352. interactive = false
  353. }
  354. opts.Prompt = strings.Join(prompts, " ")
  355. if len(prompts) > 0 {
  356. interactive = false
  357. }
  358. nowrap, err := cmd.Flags().GetBool("nowordwrap")
  359. if err != nil {
  360. return err
  361. }
  362. opts.WordWrap = !nowrap
  363. // Fill out the rest of the options based on information about the
  364. // model.
  365. client, err := api.ClientFromEnvironment()
  366. if err != nil {
  367. return err
  368. }
  369. name := args[0]
  370. info, err := func() (*api.ShowResponse, error) {
  371. showReq := &api.ShowRequest{Name: name}
  372. info, err := client.Show(cmd.Context(), showReq)
  373. var se api.StatusError
  374. if errors.As(err, &se) && se.StatusCode == http.StatusNotFound {
  375. if err := PullHandler(cmd, []string{name}); err != nil {
  376. return nil, err
  377. }
  378. return client.Show(cmd.Context(), &api.ShowRequest{Name: name})
  379. }
  380. return info, err
  381. }()
  382. if err != nil {
  383. return err
  384. }
  385. opts.MultiModal = slices.Contains(info.Details.Families, "clip")
  386. opts.ParentModel = info.Details.ParentModel
  387. if interactive {
  388. if err := loadOrUnloadModel(cmd, &opts); err != nil {
  389. return err
  390. }
  391. for _, msg := range info.Messages {
  392. switch msg.Role {
  393. case "user":
  394. fmt.Printf(">>> %s\n", msg.Content)
  395. case "assistant":
  396. state := &displayResponseState{}
  397. displayResponse(msg.Content, opts.WordWrap, state)
  398. fmt.Println()
  399. fmt.Println()
  400. }
  401. }
  402. return generateInteractive(cmd, opts)
  403. }
  404. return generate(cmd, opts)
  405. }
  406. func errFromUnknownKey(unknownKeyErr error) error {
  407. // find SSH public key in the error message
  408. sshKeyPattern := `ssh-\w+ [^\s"]+`
  409. re := regexp.MustCompile(sshKeyPattern)
  410. matches := re.FindStringSubmatch(unknownKeyErr.Error())
  411. if len(matches) > 0 {
  412. serverPubKey := matches[0]
  413. localPubKey, err := auth.GetPublicKey()
  414. if err != nil {
  415. return unknownKeyErr
  416. }
  417. if runtime.GOOS == "linux" && serverPubKey != localPubKey {
  418. // try the ollama service public key
  419. svcPubKey, err := os.ReadFile("/usr/share/ollama/.ollama/id_ed25519.pub")
  420. if err != nil {
  421. return unknownKeyErr
  422. }
  423. localPubKey = strings.TrimSpace(string(svcPubKey))
  424. }
  425. // check if the returned public key matches the local public key, this prevents adding a remote key to the user's account
  426. if serverPubKey != localPubKey {
  427. return unknownKeyErr
  428. }
  429. var msg strings.Builder
  430. msg.WriteString(unknownKeyErr.Error())
  431. msg.WriteString("\n\nYour ollama key is:\n")
  432. msg.WriteString(localPubKey)
  433. msg.WriteString("\nAdd your key at:\n")
  434. msg.WriteString("https://ollama.com/settings/keys")
  435. return errors.New(msg.String())
  436. }
  437. return unknownKeyErr
  438. }
  439. func PushHandler(cmd *cobra.Command, args []string) error {
  440. client, err := api.ClientFromEnvironment()
  441. if err != nil {
  442. return err
  443. }
  444. insecure, err := cmd.Flags().GetBool("insecure")
  445. if err != nil {
  446. return err
  447. }
  448. p := progress.NewProgress(os.Stderr)
  449. defer p.Stop()
  450. bars := make(map[string]*progress.Bar)
  451. var status string
  452. var spinner *progress.Spinner
  453. fn := func(resp api.ProgressResponse) error {
  454. if resp.Digest != "" {
  455. if spinner != nil {
  456. spinner.Stop()
  457. }
  458. bar, ok := bars[resp.Digest]
  459. if !ok {
  460. bar = progress.NewBar(fmt.Sprintf("pushing %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  461. bars[resp.Digest] = bar
  462. p.Add(resp.Digest, bar)
  463. }
  464. bar.Set(resp.Completed)
  465. } else if status != resp.Status {
  466. if spinner != nil {
  467. spinner.Stop()
  468. }
  469. status = resp.Status
  470. spinner = progress.NewSpinner(status)
  471. p.Add(status, spinner)
  472. }
  473. return nil
  474. }
  475. request := api.PushRequest{Name: args[0], Insecure: insecure}
  476. if err := client.Push(cmd.Context(), &request, fn); err != nil {
  477. if spinner != nil {
  478. spinner.Stop()
  479. }
  480. if strings.Contains(err.Error(), "access denied") {
  481. return errors.New("you are not authorized to push to this namespace, create the model under a namespace you own")
  482. }
  483. host := model.ParseName(args[0]).Host
  484. isOllamaHost := strings.HasSuffix(host, ".ollama.ai") || strings.HasSuffix(host, ".ollama.com")
  485. if strings.Contains(err.Error(), errtypes.UnknownOllamaKeyErrMsg) && isOllamaHost {
  486. // the user has not added their ollama key to ollama.com
  487. // re-throw an error with a more user-friendly message
  488. return errFromUnknownKey(err)
  489. }
  490. return err
  491. }
  492. spinner.Stop()
  493. return nil
  494. }
  495. func ListHandler(cmd *cobra.Command, args []string) error {
  496. client, err := api.ClientFromEnvironment()
  497. if err != nil {
  498. return err
  499. }
  500. models, err := client.List(cmd.Context())
  501. if err != nil {
  502. return err
  503. }
  504. var data [][]string
  505. for _, m := range models.Models {
  506. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  507. data = append(data, []string{m.Name, m.Digest[:12], format.HumanBytes(m.Size), format.HumanTime(m.ModifiedAt, "Never")})
  508. }
  509. }
  510. table := tablewriter.NewWriter(os.Stdout)
  511. table.SetHeader([]string{"NAME", "ID", "SIZE", "MODIFIED"})
  512. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  513. table.SetAlignment(tablewriter.ALIGN_LEFT)
  514. table.SetHeaderLine(false)
  515. table.SetBorder(false)
  516. table.SetNoWhiteSpace(true)
  517. table.SetTablePadding(" ")
  518. table.AppendBulk(data)
  519. table.Render()
  520. return nil
  521. }
  522. func ListRunningHandler(cmd *cobra.Command, args []string) error {
  523. client, err := api.ClientFromEnvironment()
  524. if err != nil {
  525. return err
  526. }
  527. models, err := client.ListRunning(cmd.Context())
  528. if err != nil {
  529. return err
  530. }
  531. var data [][]string
  532. for _, m := range models.Models {
  533. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  534. var procStr string
  535. switch {
  536. case m.SizeVRAM == 0:
  537. procStr = "100% CPU"
  538. case m.SizeVRAM == m.Size:
  539. procStr = "100% GPU"
  540. case m.SizeVRAM > m.Size || m.Size == 0:
  541. procStr = "Unknown"
  542. default:
  543. sizeCPU := m.Size - m.SizeVRAM
  544. cpuPercent := math.Round(float64(sizeCPU) / float64(m.Size) * 100)
  545. procStr = fmt.Sprintf("%d%%/%d%% CPU/GPU", int(cpuPercent), int(100-cpuPercent))
  546. }
  547. var until string
  548. delta := time.Since(m.ExpiresAt)
  549. if delta > 0 {
  550. until = "Stopping..."
  551. } else {
  552. until = format.HumanTime(m.ExpiresAt, "Never")
  553. }
  554. data = append(data, []string{m.Name, m.Digest[:12], format.HumanBytes(m.Size), procStr, until})
  555. }
  556. }
  557. table := tablewriter.NewWriter(os.Stdout)
  558. table.SetHeader([]string{"NAME", "ID", "SIZE", "PROCESSOR", "UNTIL"})
  559. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  560. table.SetAlignment(tablewriter.ALIGN_LEFT)
  561. table.SetHeaderLine(false)
  562. table.SetBorder(false)
  563. table.SetNoWhiteSpace(true)
  564. table.SetTablePadding(" ")
  565. table.AppendBulk(data)
  566. table.Render()
  567. return nil
  568. }
  569. func DeleteHandler(cmd *cobra.Command, args []string) error {
  570. client, err := api.ClientFromEnvironment()
  571. if err != nil {
  572. return err
  573. }
  574. for _, name := range args {
  575. req := api.DeleteRequest{Name: name}
  576. if err := client.Delete(cmd.Context(), &req); err != nil {
  577. return err
  578. }
  579. fmt.Printf("deleted '%s'\n", name)
  580. }
  581. return nil
  582. }
  583. func ShowHandler(cmd *cobra.Command, args []string) error {
  584. client, err := api.ClientFromEnvironment()
  585. if err != nil {
  586. return err
  587. }
  588. license, errLicense := cmd.Flags().GetBool("license")
  589. modelfile, errModelfile := cmd.Flags().GetBool("modelfile")
  590. parameters, errParams := cmd.Flags().GetBool("parameters")
  591. system, errSystem := cmd.Flags().GetBool("system")
  592. template, errTemplate := cmd.Flags().GetBool("template")
  593. for _, boolErr := range []error{errLicense, errModelfile, errParams, errSystem, errTemplate} {
  594. if boolErr != nil {
  595. return errors.New("error retrieving flags")
  596. }
  597. }
  598. flagsSet := 0
  599. showType := ""
  600. if license {
  601. flagsSet++
  602. showType = "license"
  603. }
  604. if modelfile {
  605. flagsSet++
  606. showType = "modelfile"
  607. }
  608. if parameters {
  609. flagsSet++
  610. showType = "parameters"
  611. }
  612. if system {
  613. flagsSet++
  614. showType = "system"
  615. }
  616. if template {
  617. flagsSet++
  618. showType = "template"
  619. }
  620. if flagsSet > 1 {
  621. return errors.New("only one of '--license', '--modelfile', '--parameters', '--system', or '--template' can be specified")
  622. }
  623. req := api.ShowRequest{Name: args[0]}
  624. resp, err := client.Show(cmd.Context(), &req)
  625. if err != nil {
  626. return err
  627. }
  628. if flagsSet == 1 {
  629. switch showType {
  630. case "license":
  631. fmt.Println(resp.License)
  632. case "modelfile":
  633. fmt.Println(resp.Modelfile)
  634. case "parameters":
  635. fmt.Println(resp.Parameters)
  636. case "system":
  637. fmt.Println(resp.System)
  638. case "template":
  639. fmt.Println(resp.Template)
  640. }
  641. return nil
  642. }
  643. return showInfo(resp, os.Stdout)
  644. }
  645. func showInfo(resp *api.ShowResponse, w io.Writer) error {
  646. tableRender := func(header string, rows func() [][]string) {
  647. fmt.Fprintln(w, " ", header)
  648. table := tablewriter.NewWriter(w)
  649. table.SetAlignment(tablewriter.ALIGN_LEFT)
  650. table.SetBorder(false)
  651. table.SetNoWhiteSpace(true)
  652. table.SetTablePadding(" ")
  653. switch header {
  654. case "Template", "System", "License":
  655. table.SetColWidth(100)
  656. }
  657. table.AppendBulk(rows())
  658. table.Render()
  659. fmt.Fprintln(w)
  660. }
  661. tableRender("Model", func() (rows [][]string) {
  662. if resp.ModelInfo != nil {
  663. arch := resp.ModelInfo["general.architecture"].(string)
  664. rows = append(rows, []string{"", "architecture", arch})
  665. rows = append(rows, []string{"", "parameters", format.HumanNumber(uint64(resp.ModelInfo["general.parameter_count"].(float64)))})
  666. rows = append(rows, []string{"", "context length", strconv.FormatFloat(resp.ModelInfo[fmt.Sprintf("%s.context_length", arch)].(float64), 'f', -1, 64)})
  667. rows = append(rows, []string{"", "embedding length", strconv.FormatFloat(resp.ModelInfo[fmt.Sprintf("%s.embedding_length", arch)].(float64), 'f', -1, 64)})
  668. } else {
  669. rows = append(rows, []string{"", "architecture", resp.Details.Family})
  670. rows = append(rows, []string{"", "parameters", resp.Details.ParameterSize})
  671. }
  672. rows = append(rows, []string{"", "quantization", resp.Details.QuantizationLevel})
  673. return
  674. })
  675. if resp.ProjectorInfo != nil {
  676. tableRender("Projector", func() (rows [][]string) {
  677. arch := resp.ProjectorInfo["general.architecture"].(string)
  678. rows = append(rows, []string{"", "architecture", arch})
  679. rows = append(rows, []string{"", "parameters", format.HumanNumber(uint64(resp.ProjectorInfo["general.parameter_count"].(float64)))})
  680. rows = append(rows, []string{"", "embedding length", strconv.FormatFloat(resp.ProjectorInfo[fmt.Sprintf("%s.vision.embedding_length", arch)].(float64), 'f', -1, 64)})
  681. rows = append(rows, []string{"", "dimensions", strconv.FormatFloat(resp.ProjectorInfo[fmt.Sprintf("%s.vision.projection_dim", arch)].(float64), 'f', -1, 64)})
  682. return
  683. })
  684. }
  685. if resp.Parameters != "" {
  686. tableRender("Parameters", func() (rows [][]string) {
  687. scanner := bufio.NewScanner(strings.NewReader(resp.Parameters))
  688. for scanner.Scan() {
  689. if text := scanner.Text(); text != "" {
  690. rows = append(rows, append([]string{""}, strings.Fields(text)...))
  691. }
  692. }
  693. return
  694. })
  695. }
  696. head := func(s string, n int) (rows [][]string) {
  697. scanner := bufio.NewScanner(strings.NewReader(s))
  698. for scanner.Scan() && (len(rows) < n || n < 0) {
  699. if text := scanner.Text(); text != "" {
  700. rows = append(rows, []string{"", strings.TrimSpace(text)})
  701. }
  702. }
  703. return
  704. }
  705. if resp.System != "" {
  706. tableRender("System", func() [][]string {
  707. return head(resp.System, 2)
  708. })
  709. }
  710. if resp.License != "" {
  711. tableRender("License", func() [][]string {
  712. return head(resp.License, 2)
  713. })
  714. }
  715. return nil
  716. }
  717. func CopyHandler(cmd *cobra.Command, args []string) error {
  718. client, err := api.ClientFromEnvironment()
  719. if err != nil {
  720. return err
  721. }
  722. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  723. if err := client.Copy(cmd.Context(), &req); err != nil {
  724. return err
  725. }
  726. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  727. return nil
  728. }
  729. func PullHandler(cmd *cobra.Command, args []string) error {
  730. insecure, err := cmd.Flags().GetBool("insecure")
  731. if err != nil {
  732. return err
  733. }
  734. client, err := api.ClientFromEnvironment()
  735. if err != nil {
  736. return err
  737. }
  738. p := progress.NewProgress(os.Stderr)
  739. defer p.Stop()
  740. bars := make(map[string]*progress.Bar)
  741. var status string
  742. var spinner *progress.Spinner
  743. fn := func(resp api.ProgressResponse) error {
  744. if resp.Digest != "" {
  745. if spinner != nil {
  746. spinner.Stop()
  747. }
  748. bar, ok := bars[resp.Digest]
  749. if !ok {
  750. bar = progress.NewBar(fmt.Sprintf("pulling %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  751. bars[resp.Digest] = bar
  752. p.Add(resp.Digest, bar)
  753. }
  754. bar.Set(resp.Completed)
  755. } else if status != resp.Status {
  756. if spinner != nil {
  757. spinner.Stop()
  758. }
  759. status = resp.Status
  760. spinner = progress.NewSpinner(status)
  761. p.Add(status, spinner)
  762. }
  763. return nil
  764. }
  765. request := api.PullRequest{Name: args[0], Insecure: insecure}
  766. if err := client.Pull(cmd.Context(), &request, fn); err != nil {
  767. return err
  768. }
  769. return nil
  770. }
  771. type generateContextKey string
  772. type runOptions struct {
  773. Model string
  774. ParentModel string
  775. Prompt string
  776. Messages []api.Message
  777. WordWrap bool
  778. Format string
  779. System string
  780. Images []api.ImageData
  781. Options map[string]interface{}
  782. MultiModal bool
  783. KeepAlive *api.Duration
  784. }
  785. type displayResponseState struct {
  786. lineLength int
  787. wordBuffer string
  788. }
  789. func displayResponse(content string, wordWrap bool, state *displayResponseState) {
  790. termWidth, _, _ := term.GetSize(int(os.Stdout.Fd()))
  791. if wordWrap && termWidth >= 10 {
  792. for _, ch := range content {
  793. if state.lineLength+1 > termWidth-5 {
  794. if runewidth.StringWidth(state.wordBuffer) > termWidth-10 {
  795. fmt.Printf("%s%c", state.wordBuffer, ch)
  796. state.wordBuffer = ""
  797. state.lineLength = 0
  798. continue
  799. }
  800. // backtrack the length of the last word and clear to the end of the line
  801. a := runewidth.StringWidth(state.wordBuffer)
  802. if a > 0 {
  803. fmt.Printf("\x1b[%dD", a)
  804. }
  805. fmt.Printf("\x1b[K\n")
  806. fmt.Printf("%s%c", state.wordBuffer, ch)
  807. chWidth := runewidth.RuneWidth(ch)
  808. state.lineLength = runewidth.StringWidth(state.wordBuffer) + chWidth
  809. } else {
  810. fmt.Print(string(ch))
  811. state.lineLength += runewidth.RuneWidth(ch)
  812. if runewidth.RuneWidth(ch) >= 2 {
  813. state.wordBuffer = ""
  814. continue
  815. }
  816. switch ch {
  817. case ' ':
  818. state.wordBuffer = ""
  819. case '\n':
  820. state.lineLength = 0
  821. default:
  822. state.wordBuffer += string(ch)
  823. }
  824. }
  825. }
  826. } else {
  827. fmt.Printf("%s%s", state.wordBuffer, content)
  828. if len(state.wordBuffer) > 0 {
  829. state.wordBuffer = ""
  830. }
  831. }
  832. }
  833. func chat(cmd *cobra.Command, opts runOptions) (*api.Message, error) {
  834. client, err := api.ClientFromEnvironment()
  835. if err != nil {
  836. return nil, err
  837. }
  838. p := progress.NewProgress(os.Stderr)
  839. defer p.StopAndClear()
  840. spinner := progress.NewSpinner("")
  841. p.Add("", spinner)
  842. cancelCtx, cancel := context.WithCancel(cmd.Context())
  843. defer cancel()
  844. sigChan := make(chan os.Signal, 1)
  845. signal.Notify(sigChan, syscall.SIGINT)
  846. go func() {
  847. <-sigChan
  848. cancel()
  849. }()
  850. var state *displayResponseState = &displayResponseState{}
  851. var latest api.ChatResponse
  852. var fullResponse strings.Builder
  853. var role string
  854. fn := func(response api.ChatResponse) error {
  855. p.StopAndClear()
  856. latest = response
  857. role = response.Message.Role
  858. content := response.Message.Content
  859. fullResponse.WriteString(content)
  860. displayResponse(content, opts.WordWrap, state)
  861. return nil
  862. }
  863. req := &api.ChatRequest{
  864. Model: opts.Model,
  865. Messages: opts.Messages,
  866. Format: opts.Format,
  867. Options: opts.Options,
  868. }
  869. if opts.KeepAlive != nil {
  870. req.KeepAlive = opts.KeepAlive
  871. }
  872. if err := client.Chat(cancelCtx, req, fn); err != nil {
  873. if errors.Is(err, context.Canceled) {
  874. return nil, nil
  875. }
  876. return nil, err
  877. }
  878. if len(opts.Messages) > 0 {
  879. fmt.Println()
  880. fmt.Println()
  881. }
  882. verbose, err := cmd.Flags().GetBool("verbose")
  883. if err != nil {
  884. return nil, err
  885. }
  886. if verbose {
  887. latest.Summary()
  888. }
  889. return &api.Message{Role: role, Content: fullResponse.String()}, nil
  890. }
  891. func generate(cmd *cobra.Command, opts runOptions) error {
  892. client, err := api.ClientFromEnvironment()
  893. if err != nil {
  894. return err
  895. }
  896. p := progress.NewProgress(os.Stderr)
  897. defer p.StopAndClear()
  898. spinner := progress.NewSpinner("")
  899. p.Add("", spinner)
  900. var latest api.GenerateResponse
  901. generateContext, ok := cmd.Context().Value(generateContextKey("context")).([]int)
  902. if !ok {
  903. generateContext = []int{}
  904. }
  905. ctx, cancel := context.WithCancel(cmd.Context())
  906. defer cancel()
  907. sigChan := make(chan os.Signal, 1)
  908. signal.Notify(sigChan, syscall.SIGINT)
  909. go func() {
  910. <-sigChan
  911. cancel()
  912. }()
  913. var state *displayResponseState = &displayResponseState{}
  914. fn := func(response api.GenerateResponse) error {
  915. p.StopAndClear()
  916. latest = response
  917. content := response.Response
  918. displayResponse(content, opts.WordWrap, state)
  919. return nil
  920. }
  921. if opts.MultiModal {
  922. opts.Prompt, opts.Images, err = extractFileData(opts.Prompt)
  923. if err != nil {
  924. return err
  925. }
  926. }
  927. request := api.GenerateRequest{
  928. Model: opts.Model,
  929. Prompt: opts.Prompt,
  930. Context: generateContext,
  931. Images: opts.Images,
  932. Format: opts.Format,
  933. System: opts.System,
  934. Options: opts.Options,
  935. KeepAlive: opts.KeepAlive,
  936. }
  937. if err := client.Generate(ctx, &request, fn); err != nil {
  938. if errors.Is(err, context.Canceled) {
  939. return nil
  940. }
  941. return err
  942. }
  943. if opts.Prompt != "" {
  944. fmt.Println()
  945. fmt.Println()
  946. }
  947. if !latest.Done {
  948. return nil
  949. }
  950. verbose, err := cmd.Flags().GetBool("verbose")
  951. if err != nil {
  952. return err
  953. }
  954. if verbose {
  955. latest.Summary()
  956. }
  957. ctx = context.WithValue(cmd.Context(), generateContextKey("context"), latest.Context)
  958. cmd.SetContext(ctx)
  959. return nil
  960. }
  961. func RunServer(_ *cobra.Command, _ []string) error {
  962. if err := initializeKeypair(); err != nil {
  963. return err
  964. }
  965. ln, err := net.Listen("tcp", envconfig.Host().Host)
  966. if err != nil {
  967. return err
  968. }
  969. err = server.Serve(ln)
  970. if errors.Is(err, http.ErrServerClosed) {
  971. return nil
  972. }
  973. return err
  974. }
  975. func initializeKeypair() error {
  976. home, err := os.UserHomeDir()
  977. if err != nil {
  978. return err
  979. }
  980. privKeyPath := filepath.Join(home, ".ollama", "id_ed25519")
  981. pubKeyPath := filepath.Join(home, ".ollama", "id_ed25519.pub")
  982. _, err = os.Stat(privKeyPath)
  983. if os.IsNotExist(err) {
  984. fmt.Printf("Couldn't find '%s'. Generating new private key.\n", privKeyPath)
  985. cryptoPublicKey, cryptoPrivateKey, err := ed25519.GenerateKey(rand.Reader)
  986. if err != nil {
  987. return err
  988. }
  989. privateKeyBytes, err := ssh.MarshalPrivateKey(cryptoPrivateKey, "")
  990. if err != nil {
  991. return err
  992. }
  993. if err := os.MkdirAll(filepath.Dir(privKeyPath), 0o755); err != nil {
  994. return fmt.Errorf("could not create directory %w", err)
  995. }
  996. if err := os.WriteFile(privKeyPath, pem.EncodeToMemory(privateKeyBytes), 0o600); err != nil {
  997. return err
  998. }
  999. sshPublicKey, err := ssh.NewPublicKey(cryptoPublicKey)
  1000. if err != nil {
  1001. return err
  1002. }
  1003. publicKeyBytes := ssh.MarshalAuthorizedKey(sshPublicKey)
  1004. if err := os.WriteFile(pubKeyPath, publicKeyBytes, 0o644); err != nil {
  1005. return err
  1006. }
  1007. fmt.Printf("Your new public key is: \n\n%s\n", publicKeyBytes)
  1008. }
  1009. return nil
  1010. }
  1011. func checkServerHeartbeat(cmd *cobra.Command, _ []string) error {
  1012. client, err := api.ClientFromEnvironment()
  1013. if err != nil {
  1014. return err
  1015. }
  1016. if err := client.Heartbeat(cmd.Context()); err != nil {
  1017. if !strings.Contains(err.Error(), " refused") {
  1018. return err
  1019. }
  1020. if err := startApp(cmd.Context(), client); err != nil {
  1021. return errors.New("could not connect to ollama app, is it running?")
  1022. }
  1023. }
  1024. return nil
  1025. }
  1026. func versionHandler(cmd *cobra.Command, _ []string) {
  1027. client, err := api.ClientFromEnvironment()
  1028. if err != nil {
  1029. return
  1030. }
  1031. serverVersion, err := client.Version(cmd.Context())
  1032. if err != nil {
  1033. fmt.Println("Warning: could not connect to a running Ollama instance")
  1034. }
  1035. if serverVersion != "" {
  1036. fmt.Printf("ollama version is %s\n", serverVersion)
  1037. }
  1038. if serverVersion != version.Version {
  1039. fmt.Printf("Warning: client version is %s\n", version.Version)
  1040. }
  1041. }
  1042. func appendEnvDocs(cmd *cobra.Command, envs []envconfig.EnvVar) {
  1043. if len(envs) == 0 {
  1044. return
  1045. }
  1046. envUsage := `
  1047. Environment Variables:
  1048. `
  1049. for _, e := range envs {
  1050. envUsage += fmt.Sprintf(" %-24s %s\n", e.Name, e.Description)
  1051. }
  1052. cmd.SetUsageTemplate(cmd.UsageTemplate() + envUsage)
  1053. }
  1054. func NewCLI() *cobra.Command {
  1055. log.SetFlags(log.LstdFlags | log.Lshortfile)
  1056. cobra.EnableCommandSorting = false
  1057. if runtime.GOOS == "windows" {
  1058. console.ConsoleFromFile(os.Stdin) //nolint:errcheck
  1059. }
  1060. rootCmd := &cobra.Command{
  1061. Use: "ollama",
  1062. Short: "Large language model runner",
  1063. SilenceUsage: true,
  1064. SilenceErrors: true,
  1065. CompletionOptions: cobra.CompletionOptions{
  1066. DisableDefaultCmd: true,
  1067. },
  1068. Run: func(cmd *cobra.Command, args []string) {
  1069. if version, _ := cmd.Flags().GetBool("version"); version {
  1070. versionHandler(cmd, args)
  1071. return
  1072. }
  1073. cmd.Print(cmd.UsageString())
  1074. },
  1075. }
  1076. rootCmd.Flags().BoolP("version", "v", false, "Show version information")
  1077. createCmd := &cobra.Command{
  1078. Use: "create MODEL",
  1079. Short: "Create a model from a Modelfile",
  1080. Args: cobra.ExactArgs(1),
  1081. PreRunE: checkServerHeartbeat,
  1082. RunE: CreateHandler,
  1083. }
  1084. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile")
  1085. createCmd.Flags().StringP("quantize", "q", "", "Quantize model to this level (e.g. q4_0)")
  1086. showCmd := &cobra.Command{
  1087. Use: "show MODEL",
  1088. Short: "Show information for a model",
  1089. Args: cobra.ExactArgs(1),
  1090. PreRunE: checkServerHeartbeat,
  1091. RunE: ShowHandler,
  1092. }
  1093. showCmd.Flags().Bool("license", false, "Show license of a model")
  1094. showCmd.Flags().Bool("modelfile", false, "Show Modelfile of a model")
  1095. showCmd.Flags().Bool("parameters", false, "Show parameters of a model")
  1096. showCmd.Flags().Bool("template", false, "Show template of a model")
  1097. showCmd.Flags().Bool("system", false, "Show system message of a model")
  1098. runCmd := &cobra.Command{
  1099. Use: "run MODEL [PROMPT]",
  1100. Short: "Run a model",
  1101. Args: cobra.MinimumNArgs(1),
  1102. PreRunE: checkServerHeartbeat,
  1103. RunE: RunHandler,
  1104. }
  1105. runCmd.Flags().String("keepalive", "", "Duration to keep a model loaded (e.g. 5m)")
  1106. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  1107. runCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  1108. runCmd.Flags().Bool("nowordwrap", false, "Don't wrap words to the next line automatically")
  1109. runCmd.Flags().String("format", "", "Response format (e.g. json)")
  1110. stopCmd := &cobra.Command{
  1111. Use: "stop MODEL",
  1112. Short: "Stop a running model",
  1113. Args: cobra.ExactArgs(1),
  1114. PreRunE: checkServerHeartbeat,
  1115. RunE: StopHandler,
  1116. }
  1117. serveCmd := &cobra.Command{
  1118. Use: "serve",
  1119. Aliases: []string{"start"},
  1120. Short: "Start ollama",
  1121. Args: cobra.ExactArgs(0),
  1122. RunE: RunServer,
  1123. }
  1124. pullCmd := &cobra.Command{
  1125. Use: "pull MODEL",
  1126. Short: "Pull a model from a registry",
  1127. Args: cobra.ExactArgs(1),
  1128. PreRunE: checkServerHeartbeat,
  1129. RunE: PullHandler,
  1130. }
  1131. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  1132. pushCmd := &cobra.Command{
  1133. Use: "push MODEL",
  1134. Short: "Push a model to a registry",
  1135. Args: cobra.ExactArgs(1),
  1136. PreRunE: checkServerHeartbeat,
  1137. RunE: PushHandler,
  1138. }
  1139. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  1140. listCmd := &cobra.Command{
  1141. Use: "list",
  1142. Aliases: []string{"ls"},
  1143. Short: "List models",
  1144. PreRunE: checkServerHeartbeat,
  1145. RunE: ListHandler,
  1146. }
  1147. psCmd := &cobra.Command{
  1148. Use: "ps",
  1149. Short: "List running models",
  1150. PreRunE: checkServerHeartbeat,
  1151. RunE: ListRunningHandler,
  1152. }
  1153. copyCmd := &cobra.Command{
  1154. Use: "cp SOURCE DESTINATION",
  1155. Short: "Copy a model",
  1156. Args: cobra.ExactArgs(2),
  1157. PreRunE: checkServerHeartbeat,
  1158. RunE: CopyHandler,
  1159. }
  1160. deleteCmd := &cobra.Command{
  1161. Use: "rm MODEL [MODEL...]",
  1162. Short: "Remove a model",
  1163. Args: cobra.MinimumNArgs(1),
  1164. PreRunE: checkServerHeartbeat,
  1165. RunE: DeleteHandler,
  1166. }
  1167. envVars := envconfig.AsMap()
  1168. envs := []envconfig.EnvVar{envVars["OLLAMA_HOST"]}
  1169. for _, cmd := range []*cobra.Command{
  1170. createCmd,
  1171. showCmd,
  1172. runCmd,
  1173. stopCmd,
  1174. pullCmd,
  1175. pushCmd,
  1176. listCmd,
  1177. psCmd,
  1178. copyCmd,
  1179. deleteCmd,
  1180. serveCmd,
  1181. } {
  1182. switch cmd {
  1183. case runCmd:
  1184. appendEnvDocs(cmd, []envconfig.EnvVar{envVars["OLLAMA_HOST"], envVars["OLLAMA_NOHISTORY"]})
  1185. case serveCmd:
  1186. appendEnvDocs(cmd, []envconfig.EnvVar{
  1187. envVars["OLLAMA_DEBUG"],
  1188. envVars["OLLAMA_HOST"],
  1189. envVars["OLLAMA_KEEP_ALIVE"],
  1190. envVars["OLLAMA_MAX_LOADED_MODELS"],
  1191. envVars["OLLAMA_MAX_QUEUE"],
  1192. envVars["OLLAMA_MODELS"],
  1193. envVars["OLLAMA_NUM_PARALLEL"],
  1194. envVars["OLLAMA_NOPRUNE"],
  1195. envVars["OLLAMA_ORIGINS"],
  1196. envVars["OLLAMA_SCHED_SPREAD"],
  1197. envVars["OLLAMA_TMPDIR"],
  1198. envVars["OLLAMA_FLASH_ATTENTION"],
  1199. envVars["OLLAMA_LLM_LIBRARY"],
  1200. envVars["OLLAMA_GPU_OVERHEAD"],
  1201. envVars["OLLAMA_LOAD_TIMEOUT"],
  1202. })
  1203. default:
  1204. appendEnvDocs(cmd, envs)
  1205. }
  1206. }
  1207. rootCmd.AddCommand(
  1208. serveCmd,
  1209. createCmd,
  1210. showCmd,
  1211. runCmd,
  1212. stopCmd,
  1213. pullCmd,
  1214. pushCmd,
  1215. listCmd,
  1216. psCmd,
  1217. copyCmd,
  1218. deleteCmd,
  1219. )
  1220. return rootCmd
  1221. }