cmd.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711
  1. package cmd
  2. import (
  3. "bufio"
  4. "context"
  5. "errors"
  6. "fmt"
  7. "io"
  8. "log"
  9. "net"
  10. "net/http"
  11. "os"
  12. "os/exec"
  13. "path/filepath"
  14. "runtime"
  15. "strings"
  16. "time"
  17. "github.com/chzyer/readline"
  18. "github.com/dustin/go-humanize"
  19. "github.com/olekukonko/tablewriter"
  20. "github.com/spf13/cobra"
  21. "github.com/jmorganca/ollama/api"
  22. "github.com/jmorganca/ollama/format"
  23. "github.com/jmorganca/ollama/progressbar"
  24. "github.com/jmorganca/ollama/server"
  25. )
  26. func CreateHandler(cmd *cobra.Command, args []string) error {
  27. filename, _ := cmd.Flags().GetString("file")
  28. filename, err := filepath.Abs(filename)
  29. if err != nil {
  30. return err
  31. }
  32. client := api.NewClient()
  33. var spinner *Spinner
  34. var currentDigest string
  35. var bar *progressbar.ProgressBar
  36. request := api.CreateRequest{Name: args[0], Path: filename}
  37. fn := func(resp api.ProgressResponse) error {
  38. if resp.Digest != currentDigest && resp.Digest != "" {
  39. if spinner != nil {
  40. spinner.Stop()
  41. }
  42. currentDigest = resp.Digest
  43. switch {
  44. case strings.Contains(resp.Status, "embeddings"):
  45. bar = progressbar.Default(int64(resp.Total), resp.Status)
  46. bar.Set(resp.Completed)
  47. default:
  48. // pulling
  49. bar = progressbar.DefaultBytes(
  50. int64(resp.Total),
  51. resp.Status,
  52. )
  53. bar.Set(resp.Completed)
  54. }
  55. } else if resp.Digest == currentDigest && resp.Digest != "" {
  56. bar.Set(resp.Completed)
  57. } else {
  58. currentDigest = ""
  59. if spinner != nil {
  60. spinner.Stop()
  61. }
  62. spinner = NewSpinner(resp.Status)
  63. go spinner.Spin(100 * time.Millisecond)
  64. }
  65. return nil
  66. }
  67. if err := client.Create(context.Background(), &request, fn); err != nil {
  68. return err
  69. }
  70. if spinner != nil {
  71. spinner.Stop()
  72. }
  73. return nil
  74. }
  75. func RunHandler(cmd *cobra.Command, args []string) error {
  76. mp := server.ParseModelPath(args[0])
  77. fp, err := mp.GetManifestPath(false)
  78. if err != nil {
  79. return err
  80. }
  81. _, err = os.Stat(fp)
  82. switch {
  83. case errors.Is(err, os.ErrNotExist):
  84. if err := pull(args[0], false); err != nil {
  85. var apiStatusError api.StatusError
  86. if !errors.As(err, &apiStatusError) {
  87. return err
  88. }
  89. if apiStatusError.StatusCode != http.StatusBadGateway {
  90. return err
  91. }
  92. }
  93. case err != nil:
  94. return err
  95. }
  96. return RunGenerate(cmd, args)
  97. }
  98. func PushHandler(cmd *cobra.Command, args []string) error {
  99. client := api.NewClient()
  100. insecure, err := cmd.Flags().GetBool("insecure")
  101. if err != nil {
  102. return err
  103. }
  104. var currentDigest string
  105. var bar *progressbar.ProgressBar
  106. request := api.PushRequest{Name: args[0], Insecure: insecure}
  107. fn := func(resp api.ProgressResponse) error {
  108. if resp.Digest != currentDigest && resp.Digest != "" {
  109. currentDigest = resp.Digest
  110. bar = progressbar.DefaultBytes(
  111. int64(resp.Total),
  112. fmt.Sprintf("pushing %s...", resp.Digest[7:19]),
  113. )
  114. bar.Set(resp.Completed)
  115. } else if resp.Digest == currentDigest && resp.Digest != "" {
  116. bar.Set(resp.Completed)
  117. } else {
  118. currentDigest = ""
  119. fmt.Println(resp.Status)
  120. }
  121. return nil
  122. }
  123. if err := client.Push(context.Background(), &request, fn); err != nil {
  124. return err
  125. }
  126. return nil
  127. }
  128. func ListHandler(cmd *cobra.Command, args []string) error {
  129. client := api.NewClient()
  130. models, err := client.List(context.Background())
  131. if err != nil {
  132. return err
  133. }
  134. var data [][]string
  135. for _, m := range models.Models {
  136. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  137. data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
  138. }
  139. }
  140. table := tablewriter.NewWriter(os.Stdout)
  141. table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
  142. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  143. table.SetAlignment(tablewriter.ALIGN_LEFT)
  144. table.SetHeaderLine(false)
  145. table.SetBorder(false)
  146. table.SetNoWhiteSpace(true)
  147. table.SetTablePadding("\t")
  148. table.AppendBulk(data)
  149. table.Render()
  150. return nil
  151. }
  152. func DeleteHandler(cmd *cobra.Command, args []string) error {
  153. client := api.NewClient()
  154. req := api.DeleteRequest{Name: args[0]}
  155. if err := client.Delete(context.Background(), &req); err != nil {
  156. return err
  157. }
  158. fmt.Printf("deleted '%s'\n", args[0])
  159. return nil
  160. }
  161. func CopyHandler(cmd *cobra.Command, args []string) error {
  162. client := api.NewClient()
  163. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  164. if err := client.Copy(context.Background(), &req); err != nil {
  165. return err
  166. }
  167. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  168. return nil
  169. }
  170. func PullHandler(cmd *cobra.Command, args []string) error {
  171. insecure, err := cmd.Flags().GetBool("insecure")
  172. if err != nil {
  173. return err
  174. }
  175. return pull(args[0], insecure)
  176. }
  177. func pull(model string, insecure bool) error {
  178. client := api.NewClient()
  179. var currentDigest string
  180. var bar *progressbar.ProgressBar
  181. request := api.PullRequest{Name: model, Insecure: insecure}
  182. fn := func(resp api.ProgressResponse) error {
  183. if resp.Digest != currentDigest && resp.Digest != "" {
  184. currentDigest = resp.Digest
  185. bar = progressbar.DefaultBytes(
  186. int64(resp.Total),
  187. fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
  188. )
  189. bar.Set(resp.Completed)
  190. } else if resp.Digest == currentDigest && resp.Digest != "" {
  191. bar.Set(resp.Completed)
  192. } else {
  193. currentDigest = ""
  194. fmt.Println(resp.Status)
  195. }
  196. return nil
  197. }
  198. if err := client.Pull(context.Background(), &request, fn); err != nil {
  199. return err
  200. }
  201. return nil
  202. }
  203. func RunGenerate(cmd *cobra.Command, args []string) error {
  204. if len(args) > 1 {
  205. // join all args into a single prompt
  206. return generate(cmd, args[0], strings.Join(args[1:], " "))
  207. }
  208. if readline.IsTerminal(int(os.Stdin.Fd())) {
  209. return generateInteractive(cmd, args[0])
  210. }
  211. return generateBatch(cmd, args[0])
  212. }
  213. type generateContextKey string
  214. func generate(cmd *cobra.Command, model, prompt string) error {
  215. if len(strings.TrimSpace(prompt)) > 0 {
  216. client := api.NewClient()
  217. spinner := NewSpinner("")
  218. go spinner.Spin(60 * time.Millisecond)
  219. var latest api.GenerateResponse
  220. generateContext, ok := cmd.Context().Value(generateContextKey("context")).([]int)
  221. if !ok {
  222. generateContext = []int{}
  223. }
  224. request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
  225. fn := func(response api.GenerateResponse) error {
  226. if !spinner.IsFinished() {
  227. spinner.Finish()
  228. }
  229. latest = response
  230. fmt.Print(response.Response)
  231. return nil
  232. }
  233. if err := client.Generate(context.Background(), &request, fn); err != nil {
  234. if strings.Contains(err.Error(), "failed to load model") {
  235. // tell the user to check the server log, if it exists locally
  236. home, nestedErr := os.UserHomeDir()
  237. if nestedErr != nil {
  238. // return the original error
  239. return err
  240. }
  241. logPath := filepath.Join(home, ".ollama", "logs", "server.log")
  242. if _, nestedErr := os.Stat(logPath); nestedErr == nil {
  243. err = fmt.Errorf("%w\nFor more details, check the error logs at %s", err, logPath)
  244. }
  245. }
  246. return err
  247. }
  248. fmt.Println()
  249. fmt.Println()
  250. verbose, err := cmd.Flags().GetBool("verbose")
  251. if err != nil {
  252. return err
  253. }
  254. if verbose {
  255. latest.Summary()
  256. }
  257. ctx := cmd.Context()
  258. ctx = context.WithValue(ctx, generateContextKey("context"), latest.Context)
  259. cmd.SetContext(ctx)
  260. }
  261. return nil
  262. }
  263. func showLayer(l *server.Layer) {
  264. filename, err := server.GetBlobsPath(l.Digest)
  265. bts, err := os.ReadFile(filename)
  266. if err != nil {
  267. fmt.Printf("Couldn't read layer")
  268. return
  269. }
  270. fmt.Printf(string(bts) + "\n")
  271. }
  272. func generateInteractive(cmd *cobra.Command, model string) error {
  273. home, err := os.UserHomeDir()
  274. if err != nil {
  275. return err
  276. }
  277. completer := readline.NewPrefixCompleter(
  278. readline.PcItem("/help"),
  279. readline.PcItem("/list"),
  280. readline.PcItem("/set",
  281. readline.PcItem("history"),
  282. readline.PcItem("nohistory"),
  283. readline.PcItem("verbose"),
  284. readline.PcItem("quiet"),
  285. readline.PcItem("mode",
  286. readline.PcItem("vim"),
  287. readline.PcItem("emacs"),
  288. readline.PcItem("default"),
  289. ),
  290. ),
  291. readline.PcItem("/show",
  292. readline.PcItem("license"),
  293. readline.PcItem("system"),
  294. readline.PcItem("template"),
  295. ),
  296. readline.PcItem("/exit"),
  297. readline.PcItem("/bye"),
  298. )
  299. usage := func() {
  300. fmt.Fprintln(os.Stderr, "commands:")
  301. fmt.Fprintln(os.Stderr, completer.Tree(" "))
  302. }
  303. config := readline.Config{
  304. Prompt: ">>> ",
  305. HistoryFile: filepath.Join(home, ".ollama", "history"),
  306. AutoComplete: completer,
  307. }
  308. scanner, err := readline.NewEx(&config)
  309. if err != nil {
  310. return err
  311. }
  312. defer scanner.Close()
  313. var multiLineBuffer string
  314. var isMultiLine bool
  315. for {
  316. line, err := scanner.Readline()
  317. switch {
  318. case errors.Is(err, io.EOF):
  319. return nil
  320. case errors.Is(err, readline.ErrInterrupt):
  321. if line == "" {
  322. return nil
  323. }
  324. continue
  325. case err != nil:
  326. return err
  327. }
  328. line = strings.TrimSpace(line)
  329. switch {
  330. case isMultiLine:
  331. if strings.HasSuffix(line, `"""`) {
  332. isMultiLine = false
  333. multiLineBuffer += strings.TrimSuffix(line, `"""`)
  334. line = multiLineBuffer
  335. multiLineBuffer = ""
  336. scanner.SetPrompt(">>> ")
  337. } else {
  338. multiLineBuffer += line + " "
  339. continue
  340. }
  341. case strings.HasPrefix(line, `"""`):
  342. isMultiLine = true
  343. multiLineBuffer = strings.TrimPrefix(line, `"""`) + " "
  344. scanner.SetPrompt("... ")
  345. continue
  346. case strings.HasPrefix(line, "/list"):
  347. args := strings.Fields(line)
  348. if err := ListHandler(cmd, args[1:]); err != nil {
  349. return err
  350. }
  351. continue
  352. case strings.HasPrefix(line, "/set"):
  353. args := strings.Fields(line)
  354. if len(args) > 1 {
  355. switch args[1] {
  356. case "history":
  357. scanner.HistoryEnable()
  358. continue
  359. case "nohistory":
  360. scanner.HistoryDisable()
  361. continue
  362. case "verbose":
  363. cmd.Flags().Set("verbose", "true")
  364. continue
  365. case "quiet":
  366. cmd.Flags().Set("verbose", "false")
  367. continue
  368. case "mode":
  369. if len(args) > 2 {
  370. switch args[2] {
  371. case "vim":
  372. scanner.SetVimMode(true)
  373. continue
  374. case "emacs", "default":
  375. scanner.SetVimMode(false)
  376. continue
  377. default:
  378. usage()
  379. continue
  380. }
  381. } else {
  382. usage()
  383. continue
  384. }
  385. }
  386. } else {
  387. usage()
  388. continue
  389. }
  390. case strings.HasPrefix(line, "/show"):
  391. args := strings.Fields(line)
  392. if len(args) > 1 {
  393. mp := server.ParseModelPath(model)
  394. manifest, err := server.GetManifest(mp)
  395. if err != nil {
  396. fmt.Printf("error: couldn't get a manifestfor this model")
  397. continue
  398. }
  399. switch args[1] {
  400. case "license":
  401. for _, l := range manifest.Layers {
  402. if l.MediaType == "application/vnd.ollama.image.license" {
  403. showLayer(l)
  404. }
  405. }
  406. continue
  407. case "system":
  408. for _, l := range manifest.Layers {
  409. if l.MediaType == "application/vnd.ollama.image.system" {
  410. showLayer(l)
  411. }
  412. }
  413. continue
  414. case "template":
  415. for _, l := range manifest.Layers {
  416. if l.MediaType == "application/vnd.ollama.image.template" {
  417. showLayer(l)
  418. }
  419. }
  420. continue
  421. default:
  422. usage()
  423. continue
  424. }
  425. } else {
  426. usage()
  427. continue
  428. }
  429. case line == "/help", line == "/?":
  430. usage()
  431. continue
  432. case line == "/exit", line == "/bye":
  433. return nil
  434. }
  435. if err := generate(cmd, model, line); err != nil {
  436. return err
  437. }
  438. }
  439. }
  440. func generateBatch(cmd *cobra.Command, model string) error {
  441. scanner := bufio.NewScanner(os.Stdin)
  442. for scanner.Scan() {
  443. prompt := scanner.Text()
  444. fmt.Printf(">>> %s\n", prompt)
  445. if err := generate(cmd, model, prompt); err != nil {
  446. return err
  447. }
  448. }
  449. return nil
  450. }
  451. // getRunServerParams takes a command and the environment variables and returns the correct params
  452. // given the order of precedence: command line args (highest), environment variables, defaults (lowest)
  453. func getRunServerParams(cmd *cobra.Command) (host, port string, extraOrigins []string, err error) {
  454. host = os.Getenv("OLLAMA_HOST")
  455. hostFlag := cmd.Flags().Lookup("host")
  456. if hostFlag == nil {
  457. return "", "", nil, errors.New("host unset")
  458. }
  459. if hostFlag.Changed || host == "" {
  460. host = hostFlag.Value.String()
  461. }
  462. port = os.Getenv("OLLAMA_PORT")
  463. portFlag := cmd.Flags().Lookup("port")
  464. if portFlag == nil {
  465. return "", "", nil, errors.New("port unset")
  466. }
  467. if portFlag.Changed || port == "" {
  468. port = portFlag.Value.String()
  469. }
  470. extraOrigins, err = cmd.Flags().GetStringSlice("origins")
  471. if err != nil {
  472. return "", "", nil, err
  473. }
  474. return host, port, extraOrigins, nil
  475. }
  476. func RunServer(cmd *cobra.Command, _ []string) error {
  477. host, port, origins, err := getRunServerParams(cmd)
  478. if err != nil {
  479. return err
  480. }
  481. ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
  482. if err != nil {
  483. return err
  484. }
  485. return server.Serve(ln, origins)
  486. }
  487. func startMacApp(client *api.Client) error {
  488. exe, err := os.Executable()
  489. if err != nil {
  490. return err
  491. }
  492. link, err := os.Readlink(exe)
  493. if err != nil {
  494. return err
  495. }
  496. if !strings.Contains(link, "Ollama.app") {
  497. return fmt.Errorf("could not find ollama app")
  498. }
  499. path := strings.Split(link, "Ollama.app")
  500. if err := exec.Command("/usr/bin/open", "-a", path[0]+"Ollama.app").Run(); err != nil {
  501. return err
  502. }
  503. // wait for the server to start
  504. timeout := time.After(5 * time.Second)
  505. tick := time.Tick(500 * time.Millisecond)
  506. for {
  507. select {
  508. case <-timeout:
  509. return errors.New("timed out waiting for server to start")
  510. case <-tick:
  511. if err := client.Heartbeat(context.Background()); err == nil {
  512. return nil // server has started
  513. }
  514. }
  515. }
  516. }
  517. func checkServerHeartbeat(_ *cobra.Command, _ []string) error {
  518. client := api.NewClient()
  519. if err := client.Heartbeat(context.Background()); err != nil {
  520. if !strings.Contains(err.Error(), "connection refused") {
  521. return err
  522. }
  523. if runtime.GOOS == "darwin" {
  524. if err := startMacApp(client); err != nil {
  525. return fmt.Errorf("could not connect to ollama app, is it running?")
  526. }
  527. } else {
  528. return fmt.Errorf("could not connect to ollama server, run 'ollama serve' to start it")
  529. }
  530. }
  531. return nil
  532. }
  533. func NewCLI() *cobra.Command {
  534. log.SetFlags(log.LstdFlags | log.Lshortfile)
  535. rootCmd := &cobra.Command{
  536. Use: "ollama",
  537. Short: "Large language model runner",
  538. SilenceUsage: true,
  539. CompletionOptions: cobra.CompletionOptions{
  540. DisableDefaultCmd: true,
  541. },
  542. }
  543. cobra.EnableCommandSorting = false
  544. createCmd := &cobra.Command{
  545. Use: "create MODEL",
  546. Short: "Create a model from a Modelfile",
  547. Args: cobra.MinimumNArgs(1),
  548. PreRunE: checkServerHeartbeat,
  549. RunE: CreateHandler,
  550. }
  551. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  552. runCmd := &cobra.Command{
  553. Use: "run MODEL [PROMPT]",
  554. Short: "Run a model",
  555. Args: cobra.MinimumNArgs(1),
  556. PreRunE: checkServerHeartbeat,
  557. RunE: RunHandler,
  558. }
  559. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  560. serveCmd := &cobra.Command{
  561. Use: "serve",
  562. Aliases: []string{"start"},
  563. Short: "Start ollama",
  564. RunE: RunServer,
  565. }
  566. serveCmd.Flags().String("port", "11434", "Port to listen on")
  567. serveCmd.Flags().String("host", "127.0.0.1", "Host to listen on")
  568. serveCmd.Flags().StringSlice("origins", nil, "Additional allowed CORS origins as comma-separated list (e.g. http://192.168.1.24:3000)")
  569. pullCmd := &cobra.Command{
  570. Use: "pull MODEL",
  571. Short: "Pull a model from a registry",
  572. Args: cobra.MinimumNArgs(1),
  573. PreRunE: checkServerHeartbeat,
  574. RunE: PullHandler,
  575. }
  576. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  577. pushCmd := &cobra.Command{
  578. Use: "push MODEL",
  579. Short: "Push a model to a registry",
  580. Args: cobra.MinimumNArgs(1),
  581. PreRunE: checkServerHeartbeat,
  582. RunE: PushHandler,
  583. }
  584. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  585. listCmd := &cobra.Command{
  586. Use: "list",
  587. Aliases: []string{"ls"},
  588. Short: "List models",
  589. PreRunE: checkServerHeartbeat,
  590. RunE: ListHandler,
  591. }
  592. copyCmd := &cobra.Command{
  593. Use: "cp",
  594. Short: "Copy a model",
  595. Args: cobra.MinimumNArgs(2),
  596. PreRunE: checkServerHeartbeat,
  597. RunE: CopyHandler,
  598. }
  599. deleteCmd := &cobra.Command{
  600. Use: "rm",
  601. Short: "Remove a model",
  602. Args: cobra.MinimumNArgs(1),
  603. PreRunE: checkServerHeartbeat,
  604. RunE: DeleteHandler,
  605. }
  606. rootCmd.AddCommand(
  607. serveCmd,
  608. createCmd,
  609. runCmd,
  610. pullCmd,
  611. pushCmd,
  612. listCmd,
  613. copyCmd,
  614. deleteCmd,
  615. )
  616. return rootCmd
  617. }