cmd.go 34 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498
  1. package cmd
  2. import (
  3. "archive/zip"
  4. "bytes"
  5. "context"
  6. "crypto/ed25519"
  7. "crypto/rand"
  8. "crypto/sha256"
  9. "encoding/json"
  10. "encoding/pem"
  11. "errors"
  12. "fmt"
  13. "io"
  14. "log"
  15. "math"
  16. "net"
  17. "net/http"
  18. "net/url"
  19. "os"
  20. "os/signal"
  21. "path/filepath"
  22. "regexp"
  23. "runtime"
  24. "slices"
  25. "strings"
  26. "syscall"
  27. "time"
  28. "github.com/containerd/console"
  29. "github.com/mattn/go-runewidth"
  30. "github.com/olekukonko/tablewriter"
  31. "github.com/spf13/cobra"
  32. "golang.org/x/crypto/ssh"
  33. "golang.org/x/term"
  34. "github.com/ollama/ollama/api"
  35. "github.com/ollama/ollama/auth"
  36. "github.com/ollama/ollama/envconfig"
  37. "github.com/ollama/ollama/format"
  38. "github.com/ollama/ollama/parser"
  39. "github.com/ollama/ollama/progress"
  40. "github.com/ollama/ollama/server"
  41. "github.com/ollama/ollama/types/errtypes"
  42. "github.com/ollama/ollama/types/model"
  43. "github.com/ollama/ollama/version"
  44. )
  45. func CreateHandler(cmd *cobra.Command, args []string) error {
  46. filename, _ := cmd.Flags().GetString("file")
  47. filename, err := filepath.Abs(filename)
  48. if err != nil {
  49. return err
  50. }
  51. client, err := api.ClientFromEnvironment()
  52. if err != nil {
  53. return err
  54. }
  55. p := progress.NewProgress(os.Stderr)
  56. defer p.Stop()
  57. f, err := os.Open(filename)
  58. if err != nil {
  59. return err
  60. }
  61. defer f.Close()
  62. modelfile, err := parser.ParseFile(f)
  63. if err != nil {
  64. return err
  65. }
  66. home, err := os.UserHomeDir()
  67. if err != nil {
  68. return err
  69. }
  70. status := "transferring model data"
  71. spinner := progress.NewSpinner(status)
  72. p.Add(status, spinner)
  73. for i := range modelfile.Commands {
  74. switch modelfile.Commands[i].Name {
  75. case "model", "adapter":
  76. path := modelfile.Commands[i].Args
  77. if path == "~" {
  78. path = home
  79. } else if strings.HasPrefix(path, "~/") {
  80. path = filepath.Join(home, path[2:])
  81. }
  82. if !filepath.IsAbs(path) {
  83. path = filepath.Join(filepath.Dir(filename), path)
  84. }
  85. fi, err := os.Stat(path)
  86. if errors.Is(err, os.ErrNotExist) && modelfile.Commands[i].Name == "model" {
  87. continue
  88. } else if err != nil {
  89. return err
  90. }
  91. if fi.IsDir() {
  92. // this is likely a safetensors or pytorch directory
  93. // TODO make this work w/ adapters
  94. tempfile, err := tempZipFiles(path)
  95. if err != nil {
  96. return err
  97. }
  98. defer os.RemoveAll(tempfile)
  99. path = tempfile
  100. }
  101. digest, err := createBlob(cmd, client, path)
  102. if err != nil {
  103. return err
  104. }
  105. modelfile.Commands[i].Args = "@" + digest
  106. }
  107. }
  108. bars := make(map[string]*progress.Bar)
  109. fn := func(resp api.ProgressResponse) error {
  110. if resp.Digest != "" {
  111. spinner.Stop()
  112. bar, ok := bars[resp.Digest]
  113. if !ok {
  114. bar = progress.NewBar(fmt.Sprintf("pulling %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  115. bars[resp.Digest] = bar
  116. p.Add(resp.Digest, bar)
  117. }
  118. bar.Set(resp.Completed)
  119. } else if status != resp.Status {
  120. spinner.Stop()
  121. status = resp.Status
  122. spinner = progress.NewSpinner(status)
  123. p.Add(status, spinner)
  124. }
  125. return nil
  126. }
  127. quantize, _ := cmd.Flags().GetString("quantize")
  128. request := api.CreateRequest{Name: args[0], Modelfile: modelfile.String(), Quantize: quantize}
  129. if err := client.Create(cmd.Context(), &request, fn); err != nil {
  130. return err
  131. }
  132. return nil
  133. }
  134. func tempZipFiles(path string) (string, error) {
  135. tempfile, err := os.CreateTemp("", "ollama-tf")
  136. if err != nil {
  137. return "", err
  138. }
  139. defer tempfile.Close()
  140. detectContentType := func(path string) (string, error) {
  141. f, err := os.Open(path)
  142. if err != nil {
  143. return "", err
  144. }
  145. defer f.Close()
  146. var b bytes.Buffer
  147. b.Grow(512)
  148. if _, err := io.CopyN(&b, f, 512); err != nil && !errors.Is(err, io.EOF) {
  149. return "", err
  150. }
  151. contentType, _, _ := strings.Cut(http.DetectContentType(b.Bytes()), ";")
  152. return contentType, nil
  153. }
  154. glob := func(pattern, contentType string) ([]string, error) {
  155. matches, err := filepath.Glob(pattern)
  156. if err != nil {
  157. return nil, err
  158. }
  159. for _, safetensor := range matches {
  160. if ct, err := detectContentType(safetensor); err != nil {
  161. return nil, err
  162. } else if ct != contentType {
  163. return nil, fmt.Errorf("invalid content type: expected %s for %s", ct, safetensor)
  164. }
  165. }
  166. return matches, nil
  167. }
  168. var files []string
  169. if st, _ := glob(filepath.Join(path, "model*.safetensors"), "application/octet-stream"); len(st) > 0 {
  170. // safetensors files might be unresolved git lfs references; skip if they are
  171. // covers model-x-of-y.safetensors, model.fp32-x-of-y.safetensors, model.safetensors
  172. files = append(files, st...)
  173. } else if pt, _ := glob(filepath.Join(path, "pytorch_model*.bin"), "application/zip"); len(pt) > 0 {
  174. // pytorch files might also be unresolved git lfs references; skip if they are
  175. // covers pytorch_model-x-of-y.bin, pytorch_model.fp32-x-of-y.bin, pytorch_model.bin
  176. files = append(files, pt...)
  177. } else if pt, _ := glob(filepath.Join(path, "consolidated*.pth"), "application/zip"); len(pt) > 0 {
  178. // pytorch files might also be unresolved git lfs references; skip if they are
  179. // covers consolidated.x.pth, consolidated.pth
  180. files = append(files, pt...)
  181. } else {
  182. return "", errors.New("no safetensors or torch files found")
  183. }
  184. // add configuration files, json files are detected as text/plain
  185. js, err := glob(filepath.Join(path, "*.json"), "text/plain")
  186. if err != nil {
  187. return "", err
  188. }
  189. files = append(files, js...)
  190. if tks, _ := glob(filepath.Join(path, "tokenizer.model"), "application/octet-stream"); len(tks) > 0 {
  191. // add tokenizer.model if it exists, tokenizer.json is automatically picked up by the previous glob
  192. // tokenizer.model might be a unresolved git lfs reference; error if it is
  193. files = append(files, tks...)
  194. } else if tks, _ := glob(filepath.Join(path, "**/tokenizer.model"), "text/plain"); len(tks) > 0 {
  195. // some times tokenizer.model is in a subdirectory (e.g. meta-llama/Meta-Llama-3-8B)
  196. files = append(files, tks...)
  197. }
  198. zipfile := zip.NewWriter(tempfile)
  199. defer zipfile.Close()
  200. for _, file := range files {
  201. f, err := os.Open(file)
  202. if err != nil {
  203. return "", err
  204. }
  205. defer f.Close()
  206. fi, err := f.Stat()
  207. if err != nil {
  208. return "", err
  209. }
  210. zfi, err := zip.FileInfoHeader(fi)
  211. if err != nil {
  212. return "", err
  213. }
  214. zf, err := zipfile.CreateHeader(zfi)
  215. if err != nil {
  216. return "", err
  217. }
  218. if _, err := io.Copy(zf, f); err != nil {
  219. return "", err
  220. }
  221. }
  222. return tempfile.Name(), nil
  223. }
// ErrBlobExists is the sentinel getLocalPath returns when there is no local
// destination to copy a blob to; createBlob reacts to it by returning the
// digest without transferring any data.
var ErrBlobExists = errors.New("blob exists")
  225. func createBlob(cmd *cobra.Command, client *api.Client, path string) (string, error) {
  226. bin, err := os.Open(path)
  227. if err != nil {
  228. return "", err
  229. }
  230. defer bin.Close()
  231. hash := sha256.New()
  232. if _, err := io.Copy(hash, bin); err != nil {
  233. return "", err
  234. }
  235. if _, err := bin.Seek(0, io.SeekStart); err != nil {
  236. return "", err
  237. }
  238. digest := fmt.Sprintf("sha256:%x", hash.Sum(nil))
  239. // Here, we want to check if the server is local
  240. // If true, call, createBlobLocal
  241. // This should find the model directory, copy blob over, and return the digest
  242. // If this fails, just upload it
  243. // If this is successful, return the digest
  244. // Resolve server to IP
  245. // Check if server is local
  246. /* if client.IsLocal() {
  247. digest = strings.ReplaceAll(digest, ":", "-")
  248. config, err := client.HeadBlob(cmd.Context(), digest)
  249. if err != nil {
  250. return "", err
  251. }
  252. modelDir := config.ModelDir
  253. // Get blob destination
  254. dest := filepath.Join(modelDir, "blobs", digest)
  255. err = createBlobLocal(path, dest)
  256. if err == nil {
  257. return digest, nil
  258. }
  259. } */
  260. if client.IsLocal() {
  261. dest, err := getLocalPath(cmd.Context(), digest)
  262. if errors.Is(err, ErrBlobExists) {
  263. return digest, nil
  264. }
  265. if err == nil {
  266. err = createBlobLocal(path, dest)
  267. if err == nil {
  268. return digest, nil
  269. }
  270. }
  271. }
  272. if err = client.CreateBlob(cmd.Context(), digest, bin); err != nil {
  273. return "", err
  274. }
  275. return digest, nil
  276. }
  277. func getLocalPath(ctx context.Context, digest string) (string, error) {
  278. ollamaHost := envconfig.Host
  279. client := http.DefaultClient
  280. base := &url.URL{
  281. Scheme: ollamaHost.Scheme,
  282. Host: net.JoinHostPort(ollamaHost.Host, ollamaHost.Port),
  283. }
  284. data, err := json.Marshal(digest)
  285. if err != nil {
  286. return "", err
  287. }
  288. reqBody := bytes.NewReader(data)
  289. path := fmt.Sprintf("/api/blobs/%s", digest)
  290. requestURL := base.JoinPath(path)
  291. request, err := http.NewRequestWithContext(ctx, http.MethodPost, requestURL.String(), reqBody)
  292. if err != nil {
  293. return "", err
  294. }
  295. authz, err := api.Authorization(ctx, request)
  296. if err != nil {
  297. return "", err
  298. }
  299. request.Header.Set("Authorization", authz)
  300. request.Header.Set("User-Agent", fmt.Sprintf("ollama/%s (%s %s) Go/%s", version.Version, runtime.GOARCH, runtime.GOOS, runtime.Version()))
  301. request.Header.Set("X-Redirect-Create", "1")
  302. resp, err := client.Do(request)
  303. if err != nil {
  304. return "", err
  305. }
  306. defer resp.Body.Close()
  307. if resp.StatusCode == http.StatusTemporaryRedirect {
  308. dest := resp.Header.Get("LocalLocation")
  309. return dest, nil
  310. }
  311. return "", ErrBlobExists
  312. }
  313. func createBlobLocal(path string, dest string) error {
  314. // This function should be called if the server is local
  315. // It should find the model directory, copy the blob over, and return the digest
  316. dirPath := filepath.Dir(dest)
  317. if err := os.MkdirAll(dirPath, 0o755); err != nil {
  318. return err
  319. }
  320. // Copy blob over
  321. sourceFile, err := os.Open(path)
  322. if err != nil {
  323. return fmt.Errorf("could not open source file: %v", err)
  324. }
  325. defer sourceFile.Close()
  326. destFile, err := os.Create(dest)
  327. if err != nil {
  328. return fmt.Errorf("could not create destination file: %v", err)
  329. }
  330. defer destFile.Close()
  331. _, err = io.CopyBuffer(destFile, sourceFile, make([]byte, 4*1024*1024))
  332. if err != nil {
  333. return fmt.Errorf("error copying file: %v", err)
  334. }
  335. err = destFile.Sync()
  336. if err != nil {
  337. return fmt.Errorf("error flushing file: %v", err)
  338. }
  339. return nil
  340. }
  341. func RunHandler(cmd *cobra.Command, args []string) error {
  342. interactive := true
  343. opts := runOptions{
  344. Model: args[0],
  345. WordWrap: os.Getenv("TERM") == "xterm-256color",
  346. Options: map[string]interface{}{},
  347. }
  348. format, err := cmd.Flags().GetString("format")
  349. if err != nil {
  350. return err
  351. }
  352. opts.Format = format
  353. keepAlive, err := cmd.Flags().GetString("keepalive")
  354. if err != nil {
  355. return err
  356. }
  357. if keepAlive != "" {
  358. d, err := time.ParseDuration(keepAlive)
  359. if err != nil {
  360. return err
  361. }
  362. opts.KeepAlive = &api.Duration{Duration: d}
  363. }
  364. prompts := args[1:]
  365. // prepend stdin to the prompt if provided
  366. if !term.IsTerminal(int(os.Stdin.Fd())) {
  367. in, err := io.ReadAll(os.Stdin)
  368. if err != nil {
  369. return err
  370. }
  371. prompts = append([]string{string(in)}, prompts...)
  372. opts.WordWrap = false
  373. interactive = false
  374. }
  375. opts.Prompt = strings.Join(prompts, " ")
  376. if len(prompts) > 0 {
  377. interactive = false
  378. }
  379. nowrap, err := cmd.Flags().GetBool("nowordwrap")
  380. if err != nil {
  381. return err
  382. }
  383. opts.WordWrap = !nowrap
  384. // Fill out the rest of the options based on information about the
  385. // model.
  386. client, err := api.ClientFromEnvironment()
  387. if err != nil {
  388. return err
  389. }
  390. name := args[0]
  391. info, err := func() (*api.ShowResponse, error) {
  392. showReq := &api.ShowRequest{Name: name}
  393. info, err := client.Show(cmd.Context(), showReq)
  394. var se api.StatusError
  395. if errors.As(err, &se) && se.StatusCode == http.StatusNotFound {
  396. if err := PullHandler(cmd, []string{name}); err != nil {
  397. return nil, err
  398. }
  399. return client.Show(cmd.Context(), &api.ShowRequest{Name: name})
  400. }
  401. return info, err
  402. }()
  403. if err != nil {
  404. return err
  405. }
  406. opts.MultiModal = slices.Contains(info.Details.Families, "clip")
  407. opts.ParentModel = info.Details.ParentModel
  408. opts.Messages = append(opts.Messages, info.Messages...)
  409. if interactive {
  410. return generateInteractive(cmd, opts)
  411. }
  412. return generate(cmd, opts)
  413. }
  414. func errFromUnknownKey(unknownKeyErr error) error {
  415. // find SSH public key in the error message
  416. sshKeyPattern := `ssh-\w+ [^\s"]+`
  417. re := regexp.MustCompile(sshKeyPattern)
  418. matches := re.FindStringSubmatch(unknownKeyErr.Error())
  419. if len(matches) > 0 {
  420. serverPubKey := matches[0]
  421. publicKey, err := auth.GetPublicKey()
  422. if err != nil {
  423. return unknownKeyErr
  424. }
  425. localPubKey := strings.TrimSpace(string(ssh.MarshalAuthorizedKey(publicKey)))
  426. if runtime.GOOS == "linux" && serverPubKey != localPubKey {
  427. // try the ollama service public key
  428. svcPubKey, err := os.ReadFile("/usr/share/ollama/.ollama/id_ed25519.pub")
  429. if err != nil {
  430. return unknownKeyErr
  431. }
  432. localPubKey = strings.TrimSpace(string(svcPubKey))
  433. }
  434. // check if the returned public key matches the local public key, this prevents adding a remote key to the user's account
  435. if serverPubKey != localPubKey {
  436. return unknownKeyErr
  437. }
  438. var msg strings.Builder
  439. msg.WriteString(unknownKeyErr.Error())
  440. msg.WriteString("\n\nYour ollama key is:\n")
  441. msg.WriteString(localPubKey)
  442. msg.WriteString("\nAdd your key at:\n")
  443. msg.WriteString("https://ollama.com/settings/keys")
  444. return errors.New(msg.String())
  445. }
  446. return unknownKeyErr
  447. }
  448. func PushHandler(cmd *cobra.Command, args []string) error {
  449. client, err := api.ClientFromEnvironment()
  450. if err != nil {
  451. return err
  452. }
  453. insecure, err := cmd.Flags().GetBool("insecure")
  454. if err != nil {
  455. return err
  456. }
  457. p := progress.NewProgress(os.Stderr)
  458. defer p.Stop()
  459. bars := make(map[string]*progress.Bar)
  460. var status string
  461. var spinner *progress.Spinner
  462. fn := func(resp api.ProgressResponse) error {
  463. if resp.Digest != "" {
  464. if spinner != nil {
  465. spinner.Stop()
  466. }
  467. bar, ok := bars[resp.Digest]
  468. if !ok {
  469. bar = progress.NewBar(fmt.Sprintf("pushing %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  470. bars[resp.Digest] = bar
  471. p.Add(resp.Digest, bar)
  472. }
  473. bar.Set(resp.Completed)
  474. } else if status != resp.Status {
  475. if spinner != nil {
  476. spinner.Stop()
  477. }
  478. status = resp.Status
  479. spinner = progress.NewSpinner(status)
  480. p.Add(status, spinner)
  481. }
  482. return nil
  483. }
  484. request := api.PushRequest{Name: args[0], Insecure: insecure}
  485. if err := client.Push(cmd.Context(), &request, fn); err != nil {
  486. if spinner != nil {
  487. spinner.Stop()
  488. }
  489. if strings.Contains(err.Error(), "access denied") {
  490. return errors.New("you are not authorized to push to this namespace, create the model under a namespace you own")
  491. }
  492. host := model.ParseName(args[0]).Host
  493. isOllamaHost := strings.HasSuffix(host, ".ollama.ai") || strings.HasSuffix(host, ".ollama.com")
  494. if strings.Contains(err.Error(), errtypes.UnknownOllamaKeyErrMsg) && isOllamaHost {
  495. // the user has not added their ollama key to ollama.com
  496. // re-throw an error with a more user-friendly message
  497. return errFromUnknownKey(err)
  498. }
  499. return err
  500. }
  501. spinner.Stop()
  502. return nil
  503. }
  504. func ListHandler(cmd *cobra.Command, args []string) error {
  505. client, err := api.ClientFromEnvironment()
  506. if err != nil {
  507. return err
  508. }
  509. models, err := client.List(cmd.Context())
  510. if err != nil {
  511. return err
  512. }
  513. var data [][]string
  514. for _, m := range models.Models {
  515. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  516. data = append(data, []string{m.Name, m.Digest[:12], format.HumanBytes(m.Size), format.HumanTime(m.ModifiedAt, "Never")})
  517. }
  518. }
  519. table := tablewriter.NewWriter(os.Stdout)
  520. table.SetHeader([]string{"NAME", "ID", "SIZE", "MODIFIED"})
  521. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  522. table.SetAlignment(tablewriter.ALIGN_LEFT)
  523. table.SetHeaderLine(false)
  524. table.SetBorder(false)
  525. table.SetNoWhiteSpace(true)
  526. table.SetTablePadding("\t")
  527. table.AppendBulk(data)
  528. table.Render()
  529. return nil
  530. }
  531. func ListRunningHandler(cmd *cobra.Command, args []string) error {
  532. client, err := api.ClientFromEnvironment()
  533. if err != nil {
  534. return err
  535. }
  536. models, err := client.ListRunning(cmd.Context())
  537. if err != nil {
  538. return err
  539. }
  540. var data [][]string
  541. for _, m := range models.Models {
  542. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  543. var procStr string
  544. switch {
  545. case m.SizeVRAM == 0:
  546. procStr = "100% CPU"
  547. case m.SizeVRAM == m.Size:
  548. procStr = "100% GPU"
  549. case m.SizeVRAM > m.Size || m.Size == 0:
  550. procStr = "Unknown"
  551. default:
  552. sizeCPU := m.Size - m.SizeVRAM
  553. cpuPercent := math.Round(float64(sizeCPU) / float64(m.Size) * 100)
  554. procStr = fmt.Sprintf("%d%%/%d%% CPU/GPU", int(cpuPercent), int(100-cpuPercent))
  555. }
  556. data = append(data, []string{m.Name, m.Digest[:12], format.HumanBytes(m.Size), procStr, format.HumanTime(m.ExpiresAt, "Never")})
  557. }
  558. }
  559. table := tablewriter.NewWriter(os.Stdout)
  560. table.SetHeader([]string{"NAME", "ID", "SIZE", "PROCESSOR", "UNTIL"})
  561. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  562. table.SetAlignment(tablewriter.ALIGN_LEFT)
  563. table.SetHeaderLine(false)
  564. table.SetBorder(false)
  565. table.SetNoWhiteSpace(true)
  566. table.SetTablePadding("\t")
  567. table.AppendBulk(data)
  568. table.Render()
  569. return nil
  570. }
  571. func DeleteHandler(cmd *cobra.Command, args []string) error {
  572. client, err := api.ClientFromEnvironment()
  573. if err != nil {
  574. return err
  575. }
  576. for _, name := range args {
  577. req := api.DeleteRequest{Name: name}
  578. if err := client.Delete(cmd.Context(), &req); err != nil {
  579. return err
  580. }
  581. fmt.Printf("deleted '%s'\n", name)
  582. }
  583. return nil
  584. }
  585. func ShowHandler(cmd *cobra.Command, args []string) error {
  586. client, err := api.ClientFromEnvironment()
  587. if err != nil {
  588. return err
  589. }
  590. license, errLicense := cmd.Flags().GetBool("license")
  591. modelfile, errModelfile := cmd.Flags().GetBool("modelfile")
  592. parameters, errParams := cmd.Flags().GetBool("parameters")
  593. system, errSystem := cmd.Flags().GetBool("system")
  594. template, errTemplate := cmd.Flags().GetBool("template")
  595. for _, boolErr := range []error{errLicense, errModelfile, errParams, errSystem, errTemplate} {
  596. if boolErr != nil {
  597. return errors.New("error retrieving flags")
  598. }
  599. }
  600. flagsSet := 0
  601. showType := ""
  602. if license {
  603. flagsSet++
  604. showType = "license"
  605. }
  606. if modelfile {
  607. flagsSet++
  608. showType = "modelfile"
  609. }
  610. if parameters {
  611. flagsSet++
  612. showType = "parameters"
  613. }
  614. if system {
  615. flagsSet++
  616. showType = "system"
  617. }
  618. if template {
  619. flagsSet++
  620. showType = "template"
  621. }
  622. if flagsSet > 1 {
  623. return errors.New("only one of '--license', '--modelfile', '--parameters', '--system', or '--template' can be specified")
  624. }
  625. req := api.ShowRequest{Name: args[0]}
  626. resp, err := client.Show(cmd.Context(), &req)
  627. if err != nil {
  628. return err
  629. }
  630. if flagsSet == 1 {
  631. switch showType {
  632. case "license":
  633. fmt.Println(resp.License)
  634. case "modelfile":
  635. fmt.Println(resp.Modelfile)
  636. case "parameters":
  637. fmt.Println(resp.Parameters)
  638. case "system":
  639. fmt.Println(resp.System)
  640. case "template":
  641. fmt.Println(resp.Template)
  642. }
  643. return nil
  644. }
  645. showInfo(resp)
  646. return nil
  647. }
  648. func showInfo(resp *api.ShowResponse) {
  649. arch := resp.ModelInfo["general.architecture"].(string)
  650. modelData := [][]string{
  651. {"arch", arch},
  652. {"parameters", resp.Details.ParameterSize},
  653. {"quantization", resp.Details.QuantizationLevel},
  654. {"context length", fmt.Sprintf("%v", resp.ModelInfo[fmt.Sprintf("%s.context_length", arch)].(float64))},
  655. {"embedding length", fmt.Sprintf("%v", resp.ModelInfo[fmt.Sprintf("%s.embedding_length", arch)].(float64))},
  656. }
  657. mainTableData := [][]string{
  658. {"Model"},
  659. {renderSubTable(modelData, false)},
  660. }
  661. if resp.ProjectorInfo != nil {
  662. projectorData := [][]string{
  663. {"arch", "clip"},
  664. {"parameters", format.HumanNumber(uint64(resp.ProjectorInfo["general.parameter_count"].(float64)))},
  665. }
  666. if projectorType, ok := resp.ProjectorInfo["clip.projector_type"]; ok {
  667. projectorData = append(projectorData, []string{"projector type", projectorType.(string)})
  668. }
  669. projectorData = append(projectorData,
  670. []string{"embedding length", fmt.Sprintf("%v", resp.ProjectorInfo["clip.vision.embedding_length"].(float64))},
  671. []string{"projection dimensionality", fmt.Sprintf("%v", resp.ProjectorInfo["clip.vision.projection_dim"].(float64))},
  672. )
  673. mainTableData = append(mainTableData,
  674. []string{"Projector"},
  675. []string{renderSubTable(projectorData, false)},
  676. )
  677. }
  678. if resp.Parameters != "" {
  679. mainTableData = append(mainTableData, []string{"Parameters"}, []string{formatParams(resp.Parameters)})
  680. }
  681. if resp.System != "" {
  682. mainTableData = append(mainTableData, []string{"System"}, []string{renderSubTable(twoLines(resp.System), true)})
  683. }
  684. if resp.License != "" {
  685. mainTableData = append(mainTableData, []string{"License"}, []string{renderSubTable(twoLines(resp.License), true)})
  686. }
  687. table := tablewriter.NewWriter(os.Stdout)
  688. table.SetAutoWrapText(false)
  689. table.SetBorder(false)
  690. table.SetAlignment(tablewriter.ALIGN_LEFT)
  691. for _, v := range mainTableData {
  692. table.Append(v)
  693. }
  694. table.Render()
  695. }
  696. func renderSubTable(data [][]string, file bool) string {
  697. var buf bytes.Buffer
  698. table := tablewriter.NewWriter(&buf)
  699. table.SetAutoWrapText(!file)
  700. table.SetBorder(false)
  701. table.SetNoWhiteSpace(true)
  702. table.SetTablePadding("\t")
  703. table.SetAlignment(tablewriter.ALIGN_LEFT)
  704. for _, v := range data {
  705. table.Append(v)
  706. }
  707. table.Render()
  708. renderedTable := buf.String()
  709. lines := strings.Split(renderedTable, "\n")
  710. for i, line := range lines {
  711. lines[i] = "\t" + line
  712. }
  713. return strings.Join(lines, "\n")
  714. }
  715. func twoLines(s string) [][]string {
  716. lines := strings.Split(s, "\n")
  717. res := [][]string{}
  718. count := 0
  719. for _, line := range lines {
  720. line = strings.TrimSpace(line)
  721. if line != "" {
  722. count++
  723. res = append(res, []string{line})
  724. if count == 2 {
  725. return res
  726. }
  727. }
  728. }
  729. return res
  730. }
  731. func formatParams(s string) string {
  732. lines := strings.Split(s, "\n")
  733. table := [][]string{}
  734. for _, line := range lines {
  735. table = append(table, strings.Fields(line))
  736. }
  737. return renderSubTable(table, false)
  738. }
  739. func CopyHandler(cmd *cobra.Command, args []string) error {
  740. client, err := api.ClientFromEnvironment()
  741. if err != nil {
  742. return err
  743. }
  744. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  745. if err := client.Copy(cmd.Context(), &req); err != nil {
  746. return err
  747. }
  748. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  749. return nil
  750. }
  751. func PullHandler(cmd *cobra.Command, args []string) error {
  752. insecure, err := cmd.Flags().GetBool("insecure")
  753. if err != nil {
  754. return err
  755. }
  756. client, err := api.ClientFromEnvironment()
  757. if err != nil {
  758. return err
  759. }
  760. p := progress.NewProgress(os.Stderr)
  761. defer p.Stop()
  762. bars := make(map[string]*progress.Bar)
  763. var status string
  764. var spinner *progress.Spinner
  765. fn := func(resp api.ProgressResponse) error {
  766. if resp.Digest != "" {
  767. if spinner != nil {
  768. spinner.Stop()
  769. }
  770. bar, ok := bars[resp.Digest]
  771. if !ok {
  772. bar = progress.NewBar(fmt.Sprintf("pulling %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  773. bars[resp.Digest] = bar
  774. p.Add(resp.Digest, bar)
  775. }
  776. bar.Set(resp.Completed)
  777. } else if status != resp.Status {
  778. if spinner != nil {
  779. spinner.Stop()
  780. }
  781. status = resp.Status
  782. spinner = progress.NewSpinner(status)
  783. p.Add(status, spinner)
  784. }
  785. return nil
  786. }
  787. request := api.PullRequest{Name: args[0], Insecure: insecure}
  788. if err := client.Pull(cmd.Context(), &request, fn); err != nil {
  789. return err
  790. }
  791. return nil
  792. }
// generateContextKey is a distinct string type.
// NOTE(review): presumably the key type for values stored in a
// context.Context during generation; its uses are outside this section —
// confirm.
type generateContextKey string
// runOptions bundles the settings for running a model. RunHandler builds one
// from the command line and the server's description of the model, then hands
// it to generate or generateInteractive.
type runOptions struct {
	// Model is the model name; RunHandler takes it from the first argument.
	Model string
	// ParentModel is copied from the Details.ParentModel field of the Show
	// response.
	ParentModel string
	// Prompt is the prompt text; RunHandler joins stdin content and the
	// remaining arguments with spaces.
	Prompt string
	// Messages is seeded by RunHandler with the messages of the Show response.
	Messages []api.Message
	// WordWrap enables word wrapping of the displayed response.
	WordWrap bool
	// Format is the value of the "format" flag.
	Format string
	// System is not set in this section.
	// NOTE(review): presumably a system prompt override — confirm.
	System string
	// Template is not set in this section.
	// NOTE(review): presumably a prompt template override — confirm.
	Template string
	// Images is not set in this section.
	// NOTE(review): presumably images sent along with the prompt — confirm.
	Images []api.ImageData
	// Options starts out as an empty map in RunHandler.
	// NOTE(review): presumably model parameters passed to the server — confirm.
	Options map[string]interface{}
	// MultiModal is true when the model's families include "clip".
	MultiModal bool
	// KeepAlive is the parsed "keepalive" flag; nil when the flag is empty.
	KeepAlive *api.Duration
}
// displayResponseState carries displayResponse's word-wrapping state across
// successive calls for the same streamed response.
type displayResponseState struct {
	// lineLength is the display width already printed on the current line.
	lineLength int
	// wordBuffer holds the characters of the word currently being printed, so
	// the word can be re-printed on the next line when it has to wrap.
	wordBuffer string
}
  812. func displayResponse(content string, wordWrap bool, state *displayResponseState) {
  813. termWidth, _, _ := term.GetSize(int(os.Stdout.Fd()))
  814. if wordWrap && termWidth >= 10 {
  815. for _, ch := range content {
  816. if state.lineLength+1 > termWidth-5 {
  817. if runewidth.StringWidth(state.wordBuffer) > termWidth-10 {
  818. fmt.Printf("%s%c", state.wordBuffer, ch)
  819. state.wordBuffer = ""
  820. state.lineLength = 0
  821. continue
  822. }
  823. // backtrack the length of the last word and clear to the end of the line
  824. a := runewidth.StringWidth(state.wordBuffer)
  825. if a > 0 {
  826. fmt.Printf("\x1b[%dD", a)
  827. }
  828. fmt.Printf("\x1b[K\n")
  829. fmt.Printf("%s%c", state.wordBuffer, ch)
  830. chWidth := runewidth.RuneWidth(ch)
  831. state.lineLength = runewidth.StringWidth(state.wordBuffer) + chWidth
  832. } else {
  833. fmt.Print(string(ch))
  834. state.lineLength += runewidth.RuneWidth(ch)
  835. if runewidth.RuneWidth(ch) >= 2 {
  836. state.wordBuffer = ""
  837. continue
  838. }
  839. switch ch {
  840. case ' ':
  841. state.wordBuffer = ""
  842. case '\n':
  843. state.lineLength = 0
  844. default:
  845. state.wordBuffer += string(ch)
  846. }
  847. }
  848. }
  849. } else {
  850. fmt.Printf("%s%s", state.wordBuffer, content)
  851. if len(state.wordBuffer) > 0 {
  852. state.wordBuffer = ""
  853. }
  854. }
  855. }
  856. func chat(cmd *cobra.Command, opts runOptions) (*api.Message, error) {
  857. client, err := api.ClientFromEnvironment()
  858. if err != nil {
  859. return nil, err
  860. }
  861. p := progress.NewProgress(os.Stderr)
  862. defer p.StopAndClear()
  863. spinner := progress.NewSpinner("")
  864. p.Add("", spinner)
  865. cancelCtx, cancel := context.WithCancel(cmd.Context())
  866. defer cancel()
  867. sigChan := make(chan os.Signal, 1)
  868. signal.Notify(sigChan, syscall.SIGINT)
  869. go func() {
  870. <-sigChan
  871. cancel()
  872. }()
  873. var state *displayResponseState = &displayResponseState{}
  874. var latest api.ChatResponse
  875. var fullResponse strings.Builder
  876. var role string
  877. fn := func(response api.ChatResponse) error {
  878. p.StopAndClear()
  879. latest = response
  880. role = response.Message.Role
  881. content := response.Message.Content
  882. fullResponse.WriteString(content)
  883. displayResponse(content, opts.WordWrap, state)
  884. return nil
  885. }
  886. req := &api.ChatRequest{
  887. Model: opts.Model,
  888. Messages: opts.Messages,
  889. Format: opts.Format,
  890. Options: opts.Options,
  891. }
  892. if opts.KeepAlive != nil {
  893. req.KeepAlive = opts.KeepAlive
  894. }
  895. if err := client.Chat(cancelCtx, req, fn); err != nil {
  896. if errors.Is(err, context.Canceled) {
  897. return nil, nil
  898. }
  899. return nil, err
  900. }
  901. if len(opts.Messages) > 0 {
  902. fmt.Println()
  903. fmt.Println()
  904. }
  905. verbose, err := cmd.Flags().GetBool("verbose")
  906. if err != nil {
  907. return nil, err
  908. }
  909. if verbose {
  910. latest.Summary()
  911. }
  912. return &api.Message{Role: role, Content: fullResponse.String()}, nil
  913. }
  914. func generate(cmd *cobra.Command, opts runOptions) error {
  915. client, err := api.ClientFromEnvironment()
  916. if err != nil {
  917. return err
  918. }
  919. p := progress.NewProgress(os.Stderr)
  920. defer p.StopAndClear()
  921. spinner := progress.NewSpinner("")
  922. p.Add("", spinner)
  923. var latest api.GenerateResponse
  924. generateContext, ok := cmd.Context().Value(generateContextKey("context")).([]int)
  925. if !ok {
  926. generateContext = []int{}
  927. }
  928. ctx, cancel := context.WithCancel(cmd.Context())
  929. defer cancel()
  930. sigChan := make(chan os.Signal, 1)
  931. signal.Notify(sigChan, syscall.SIGINT)
  932. go func() {
  933. <-sigChan
  934. cancel()
  935. }()
  936. var state *displayResponseState = &displayResponseState{}
  937. fn := func(response api.GenerateResponse) error {
  938. p.StopAndClear()
  939. latest = response
  940. content := response.Response
  941. displayResponse(content, opts.WordWrap, state)
  942. return nil
  943. }
  944. if opts.MultiModal {
  945. opts.Prompt, opts.Images, err = extractFileData(opts.Prompt)
  946. if err != nil {
  947. return err
  948. }
  949. }
  950. request := api.GenerateRequest{
  951. Model: opts.Model,
  952. Prompt: opts.Prompt,
  953. Context: generateContext,
  954. Images: opts.Images,
  955. Format: opts.Format,
  956. System: opts.System,
  957. Template: opts.Template,
  958. Options: opts.Options,
  959. KeepAlive: opts.KeepAlive,
  960. }
  961. if err := client.Generate(ctx, &request, fn); err != nil {
  962. if errors.Is(err, context.Canceled) {
  963. return nil
  964. }
  965. return err
  966. }
  967. if opts.Prompt != "" {
  968. fmt.Println()
  969. fmt.Println()
  970. }
  971. if !latest.Done {
  972. return nil
  973. }
  974. verbose, err := cmd.Flags().GetBool("verbose")
  975. if err != nil {
  976. return err
  977. }
  978. if verbose {
  979. latest.Summary()
  980. }
  981. ctx = context.WithValue(cmd.Context(), generateContextKey("context"), latest.Context)
  982. cmd.SetContext(ctx)
  983. return nil
  984. }
  985. func RunServer(cmd *cobra.Command, _ []string) error {
  986. if err := initializeKeypair(); err != nil {
  987. return err
  988. }
  989. ln, err := net.Listen("tcp", net.JoinHostPort(envconfig.Host.Host, envconfig.Host.Port))
  990. if err != nil {
  991. return err
  992. }
  993. err = server.Serve(ln)
  994. if errors.Is(err, http.ErrServerClosed) {
  995. return nil
  996. }
  997. return err
  998. }
  999. func initializeKeypair() error {
  1000. home, err := os.UserHomeDir()
  1001. if err != nil {
  1002. return err
  1003. }
  1004. privKeyPath := filepath.Join(home, ".ollama", "id_ed25519")
  1005. pubKeyPath := filepath.Join(home, ".ollama", "id_ed25519.pub")
  1006. _, err = os.Stat(privKeyPath)
  1007. if os.IsNotExist(err) {
  1008. fmt.Printf("Couldn't find '%s'. Generating new private key.\n", privKeyPath)
  1009. cryptoPublicKey, cryptoPrivateKey, err := ed25519.GenerateKey(rand.Reader)
  1010. if err != nil {
  1011. return err
  1012. }
  1013. privateKeyBytes, err := ssh.MarshalPrivateKey(cryptoPrivateKey, "")
  1014. if err != nil {
  1015. return err
  1016. }
  1017. if err := os.MkdirAll(filepath.Dir(privKeyPath), 0o755); err != nil {
  1018. return fmt.Errorf("could not create directory %w", err)
  1019. }
  1020. if err := os.WriteFile(privKeyPath, pem.EncodeToMemory(privateKeyBytes), 0o600); err != nil {
  1021. return err
  1022. }
  1023. sshPublicKey, err := ssh.NewPublicKey(cryptoPublicKey)
  1024. if err != nil {
  1025. return err
  1026. }
  1027. publicKeyBytes := ssh.MarshalAuthorizedKey(sshPublicKey)
  1028. if err := os.WriteFile(pubKeyPath, publicKeyBytes, 0o644); err != nil {
  1029. return err
  1030. }
  1031. fmt.Printf("Your new public key is: \n\n%s\n", publicKeyBytes)
  1032. }
  1033. return nil
  1034. }
  1035. func checkServerHeartbeat(cmd *cobra.Command, _ []string) error {
  1036. client, err := api.ClientFromEnvironment()
  1037. if err != nil {
  1038. return err
  1039. }
  1040. if err := client.Heartbeat(cmd.Context()); err != nil {
  1041. if !strings.Contains(err.Error(), " refused") {
  1042. return err
  1043. }
  1044. if err := startApp(cmd.Context(), client); err != nil {
  1045. return fmt.Errorf("could not connect to ollama app, is it running?")
  1046. }
  1047. }
  1048. return nil
  1049. }
  1050. func versionHandler(cmd *cobra.Command, _ []string) {
  1051. client, err := api.ClientFromEnvironment()
  1052. if err != nil {
  1053. return
  1054. }
  1055. serverVersion, err := client.Version(cmd.Context())
  1056. if err != nil {
  1057. fmt.Println("Warning: could not connect to a running Ollama instance")
  1058. }
  1059. if serverVersion != "" {
  1060. fmt.Printf("ollama version is %s\n", serverVersion)
  1061. }
  1062. if serverVersion != version.Version {
  1063. fmt.Printf("Warning: client version is %s\n", version.Version)
  1064. }
  1065. }
  1066. func appendEnvDocs(cmd *cobra.Command, envs []envconfig.EnvVar) {
  1067. if len(envs) == 0 {
  1068. return
  1069. }
  1070. envUsage := `
  1071. Environment Variables:
  1072. `
  1073. for _, e := range envs {
  1074. envUsage += fmt.Sprintf(" %-24s %s\n", e.Name, e.Description)
  1075. }
  1076. cmd.SetUsageTemplate(cmd.UsageTemplate() + envUsage)
  1077. }
  1078. func NewCLI() *cobra.Command {
  1079. log.SetFlags(log.LstdFlags | log.Lshortfile)
  1080. cobra.EnableCommandSorting = false
  1081. if runtime.GOOS == "windows" {
  1082. console.ConsoleFromFile(os.Stdin) //nolint:errcheck
  1083. }
  1084. rootCmd := &cobra.Command{
  1085. Use: "ollama",
  1086. Short: "Large language model runner",
  1087. SilenceUsage: true,
  1088. SilenceErrors: true,
  1089. CompletionOptions: cobra.CompletionOptions{
  1090. DisableDefaultCmd: true,
  1091. },
  1092. Run: func(cmd *cobra.Command, args []string) {
  1093. if version, _ := cmd.Flags().GetBool("version"); version {
  1094. versionHandler(cmd, args)
  1095. return
  1096. }
  1097. cmd.Print(cmd.UsageString())
  1098. },
  1099. }
  1100. rootCmd.Flags().BoolP("version", "v", false, "Show version information")
  1101. createCmd := &cobra.Command{
  1102. Use: "create MODEL",
  1103. Short: "Create a model from a Modelfile",
  1104. Args: cobra.ExactArgs(1),
  1105. PreRunE: checkServerHeartbeat,
  1106. RunE: CreateHandler,
  1107. }
  1108. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile")
  1109. createCmd.Flags().StringP("quantize", "q", "", "Quantize model to this level (e.g. q4_0)")
  1110. showCmd := &cobra.Command{
  1111. Use: "show MODEL",
  1112. Short: "Show information for a model",
  1113. Args: cobra.ExactArgs(1),
  1114. PreRunE: checkServerHeartbeat,
  1115. RunE: ShowHandler,
  1116. }
  1117. showCmd.Flags().Bool("license", false, "Show license of a model")
  1118. showCmd.Flags().Bool("modelfile", false, "Show Modelfile of a model")
  1119. showCmd.Flags().Bool("parameters", false, "Show parameters of a model")
  1120. showCmd.Flags().Bool("template", false, "Show template of a model")
  1121. showCmd.Flags().Bool("system", false, "Show system message of a model")
  1122. runCmd := &cobra.Command{
  1123. Use: "run MODEL [PROMPT]",
  1124. Short: "Run a model",
  1125. Args: cobra.MinimumNArgs(1),
  1126. PreRunE: checkServerHeartbeat,
  1127. RunE: RunHandler,
  1128. }
  1129. runCmd.Flags().String("keepalive", "", "Duration to keep a model loaded (e.g. 5m)")
  1130. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  1131. runCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  1132. runCmd.Flags().Bool("nowordwrap", false, "Don't wrap words to the next line automatically")
  1133. runCmd.Flags().String("format", "", "Response format (e.g. json)")
  1134. serveCmd := &cobra.Command{
  1135. Use: "serve",
  1136. Aliases: []string{"start"},
  1137. Short: "Start ollama",
  1138. Args: cobra.ExactArgs(0),
  1139. RunE: RunServer,
  1140. }
  1141. pullCmd := &cobra.Command{
  1142. Use: "pull MODEL",
  1143. Short: "Pull a model from a registry",
  1144. Args: cobra.ExactArgs(1),
  1145. PreRunE: checkServerHeartbeat,
  1146. RunE: PullHandler,
  1147. }
  1148. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  1149. pushCmd := &cobra.Command{
  1150. Use: "push MODEL",
  1151. Short: "Push a model to a registry",
  1152. Args: cobra.ExactArgs(1),
  1153. PreRunE: checkServerHeartbeat,
  1154. RunE: PushHandler,
  1155. }
  1156. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  1157. listCmd := &cobra.Command{
  1158. Use: "list",
  1159. Aliases: []string{"ls"},
  1160. Short: "List models",
  1161. PreRunE: checkServerHeartbeat,
  1162. RunE: ListHandler,
  1163. }
  1164. psCmd := &cobra.Command{
  1165. Use: "ps",
  1166. Short: "List running models",
  1167. PreRunE: checkServerHeartbeat,
  1168. RunE: ListRunningHandler,
  1169. }
  1170. copyCmd := &cobra.Command{
  1171. Use: "cp SOURCE DESTINATION",
  1172. Short: "Copy a model",
  1173. Args: cobra.ExactArgs(2),
  1174. PreRunE: checkServerHeartbeat,
  1175. RunE: CopyHandler,
  1176. }
  1177. deleteCmd := &cobra.Command{
  1178. Use: "rm MODEL [MODEL...]",
  1179. Short: "Remove a model",
  1180. Args: cobra.MinimumNArgs(1),
  1181. PreRunE: checkServerHeartbeat,
  1182. RunE: DeleteHandler,
  1183. }
  1184. envVars := envconfig.AsMap()
  1185. envs := []envconfig.EnvVar{envVars["OLLAMA_HOST"]}
  1186. for _, cmd := range []*cobra.Command{
  1187. createCmd,
  1188. showCmd,
  1189. runCmd,
  1190. pullCmd,
  1191. pushCmd,
  1192. listCmd,
  1193. psCmd,
  1194. copyCmd,
  1195. deleteCmd,
  1196. serveCmd,
  1197. } {
  1198. switch cmd {
  1199. case runCmd:
  1200. appendEnvDocs(cmd, []envconfig.EnvVar{envVars["OLLAMA_HOST"], envVars["OLLAMA_NOHISTORY"]})
  1201. case serveCmd:
  1202. appendEnvDocs(cmd, []envconfig.EnvVar{
  1203. envVars["OLLAMA_DEBUG"],
  1204. envVars["OLLAMA_HOST"],
  1205. envVars["OLLAMA_KEEP_ALIVE"],
  1206. envVars["OLLAMA_MAX_LOADED_MODELS"],
  1207. envVars["OLLAMA_MAX_QUEUE"],
  1208. envVars["OLLAMA_MODELS"],
  1209. envVars["OLLAMA_NUM_PARALLEL"],
  1210. envVars["OLLAMA_NOPRUNE"],
  1211. envVars["OLLAMA_ORIGINS"],
  1212. envVars["OLLAMA_TMPDIR"],
  1213. envVars["OLLAMA_FLASH_ATTENTION"],
  1214. envVars["OLLAMA_LLM_LIBRARY"],
  1215. envVars["OLLAMA_MAX_VRAM"],
  1216. })
  1217. default:
  1218. appendEnvDocs(cmd, envs)
  1219. }
  1220. }
  1221. rootCmd.AddCommand(
  1222. serveCmd,
  1223. createCmd,
  1224. showCmd,
  1225. runCmd,
  1226. pullCmd,
  1227. pushCmd,
  1228. listCmd,
  1229. psCmd,
  1230. copyCmd,
  1231. deleteCmd,
  1232. )
  1233. return rootCmd
  1234. }