cmd.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705
  1. package cmd
  2. import (
  3. "bufio"
  4. "context"
  5. "errors"
  6. "fmt"
  7. "io"
  8. "log"
  9. "net"
  10. "net/http"
  11. "os"
  12. "os/exec"
  13. "path/filepath"
  14. "runtime"
  15. "strings"
  16. "time"
  17. "github.com/chzyer/readline"
  18. "github.com/dustin/go-humanize"
  19. "github.com/olekukonko/tablewriter"
  20. "github.com/spf13/cobra"
  21. "github.com/jmorganca/ollama/api"
  22. "github.com/jmorganca/ollama/format"
  23. "github.com/jmorganca/ollama/progressbar"
  24. "github.com/jmorganca/ollama/server"
  25. )
  26. func CreateHandler(cmd *cobra.Command, args []string) error {
  27. filename, _ := cmd.Flags().GetString("file")
  28. filename, err := filepath.Abs(filename)
  29. if err != nil {
  30. return err
  31. }
  32. client := api.NewClient()
  33. var spinner *Spinner
  34. var currentDigest string
  35. var bar *progressbar.ProgressBar
  36. request := api.CreateRequest{Name: args[0], Path: filename}
  37. fn := func(resp api.ProgressResponse) error {
  38. if resp.Digest != currentDigest && resp.Digest != "" {
  39. if spinner != nil {
  40. spinner.Stop()
  41. }
  42. currentDigest = resp.Digest
  43. bar = progressbar.DefaultBytes(
  44. int64(resp.Total),
  45. fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
  46. )
  47. bar.Set(resp.Completed)
  48. } else if resp.Digest == currentDigest && resp.Digest != "" {
  49. bar.Set(resp.Completed)
  50. } else {
  51. currentDigest = ""
  52. if spinner != nil {
  53. spinner.Stop()
  54. }
  55. spinner = NewSpinner(resp.Status)
  56. go spinner.Spin(100 * time.Millisecond)
  57. }
  58. return nil
  59. }
  60. if err := client.Create(context.Background(), &request, fn); err != nil {
  61. return err
  62. }
  63. if spinner != nil {
  64. spinner.Stop()
  65. }
  66. return nil
  67. }
  68. func RunHandler(cmd *cobra.Command, args []string) error {
  69. mp := server.ParseModelPath(args[0])
  70. fp, err := mp.GetManifestPath(false)
  71. if err != nil {
  72. return err
  73. }
  74. _, err = os.Stat(fp)
  75. switch {
  76. case errors.Is(err, os.ErrNotExist):
  77. if err := pull(args[0], false); err != nil {
  78. var apiStatusError api.StatusError
  79. if !errors.As(err, &apiStatusError) {
  80. return err
  81. }
  82. if apiStatusError.StatusCode != http.StatusBadGateway {
  83. return err
  84. }
  85. }
  86. case err != nil:
  87. return err
  88. }
  89. return RunGenerate(cmd, args)
  90. }
  91. func PushHandler(cmd *cobra.Command, args []string) error {
  92. client := api.NewClient()
  93. insecure, err := cmd.Flags().GetBool("insecure")
  94. if err != nil {
  95. return err
  96. }
  97. var currentDigest string
  98. var bar *progressbar.ProgressBar
  99. request := api.PushRequest{Name: args[0], Insecure: insecure}
  100. fn := func(resp api.ProgressResponse) error {
  101. if resp.Digest != currentDigest && resp.Digest != "" {
  102. currentDigest = resp.Digest
  103. bar = progressbar.DefaultBytes(
  104. int64(resp.Total),
  105. fmt.Sprintf("pushing %s...", resp.Digest[7:19]),
  106. )
  107. bar.Set(resp.Completed)
  108. } else if resp.Digest == currentDigest && resp.Digest != "" {
  109. bar.Set(resp.Completed)
  110. } else {
  111. currentDigest = ""
  112. fmt.Println(resp.Status)
  113. }
  114. return nil
  115. }
  116. if err := client.Push(context.Background(), &request, fn); err != nil {
  117. return err
  118. }
  119. return nil
  120. }
  121. func ListHandler(cmd *cobra.Command, args []string) error {
  122. client := api.NewClient()
  123. models, err := client.List(context.Background())
  124. if err != nil {
  125. return err
  126. }
  127. var data [][]string
  128. for _, m := range models.Models {
  129. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  130. data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
  131. }
  132. }
  133. table := tablewriter.NewWriter(os.Stdout)
  134. table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
  135. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  136. table.SetAlignment(tablewriter.ALIGN_LEFT)
  137. table.SetHeaderLine(false)
  138. table.SetBorder(false)
  139. table.SetNoWhiteSpace(true)
  140. table.SetTablePadding("\t")
  141. table.AppendBulk(data)
  142. table.Render()
  143. return nil
  144. }
  145. func DeleteHandler(cmd *cobra.Command, args []string) error {
  146. client := api.NewClient()
  147. req := api.DeleteRequest{Name: args[0]}
  148. if err := client.Delete(context.Background(), &req); err != nil {
  149. return err
  150. }
  151. fmt.Printf("deleted '%s'\n", args[0])
  152. return nil
  153. }
  154. func CopyHandler(cmd *cobra.Command, args []string) error {
  155. client := api.NewClient()
  156. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  157. if err := client.Copy(context.Background(), &req); err != nil {
  158. return err
  159. }
  160. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  161. return nil
  162. }
  163. func PullHandler(cmd *cobra.Command, args []string) error {
  164. insecure, err := cmd.Flags().GetBool("insecure")
  165. if err != nil {
  166. return err
  167. }
  168. return pull(args[0], insecure)
  169. }
  170. func pull(model string, insecure bool) error {
  171. client := api.NewClient()
  172. var currentDigest string
  173. var bar *progressbar.ProgressBar
  174. request := api.PullRequest{Name: model, Insecure: insecure}
  175. fn := func(resp api.ProgressResponse) error {
  176. if resp.Digest != currentDigest && resp.Digest != "" {
  177. currentDigest = resp.Digest
  178. bar = progressbar.DefaultBytes(
  179. int64(resp.Total),
  180. fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
  181. )
  182. bar.Set(resp.Completed)
  183. } else if resp.Digest == currentDigest && resp.Digest != "" {
  184. bar.Set(resp.Completed)
  185. } else {
  186. currentDigest = ""
  187. fmt.Println(resp.Status)
  188. }
  189. return nil
  190. }
  191. if err := client.Pull(context.Background(), &request, fn); err != nil {
  192. return err
  193. }
  194. return nil
  195. }
  196. func RunGenerate(cmd *cobra.Command, args []string) error {
  197. if len(args) > 1 {
  198. // join all args into a single prompt
  199. return generate(cmd, args[0], strings.Join(args[1:], " "))
  200. }
  201. if readline.IsTerminal(int(os.Stdin.Fd())) {
  202. return generateInteractive(cmd, args[0])
  203. }
  204. return generateBatch(cmd, args[0])
  205. }
  206. type generateContextKey string
  207. func generate(cmd *cobra.Command, model, prompt string) error {
  208. if len(strings.TrimSpace(prompt)) > 0 {
  209. client := api.NewClient()
  210. spinner := NewSpinner("")
  211. go spinner.Spin(60 * time.Millisecond)
  212. var latest api.GenerateResponse
  213. generateContext, ok := cmd.Context().Value(generateContextKey("context")).([]int)
  214. if !ok {
  215. generateContext = []int{}
  216. }
  217. request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
  218. fn := func(response api.GenerateResponse) error {
  219. if !spinner.IsFinished() {
  220. spinner.Finish()
  221. }
  222. latest = response
  223. fmt.Print(response.Response)
  224. return nil
  225. }
  226. if err := client.Generate(context.Background(), &request, fn); err != nil {
  227. if strings.Contains(err.Error(), "failed to load model") {
  228. // tell the user to check the server log, if it exists locally
  229. home, nestedErr := os.UserHomeDir()
  230. if nestedErr != nil {
  231. // return the original error
  232. return err
  233. }
  234. logPath := filepath.Join(home, ".ollama", "logs", "server.log")
  235. if _, nestedErr := os.Stat(logPath); nestedErr == nil {
  236. err = fmt.Errorf("%w\nFor more details, check the error logs at %s", err, logPath)
  237. }
  238. }
  239. return err
  240. }
  241. fmt.Println()
  242. fmt.Println()
  243. verbose, err := cmd.Flags().GetBool("verbose")
  244. if err != nil {
  245. return err
  246. }
  247. if verbose {
  248. latest.Summary()
  249. }
  250. ctx := cmd.Context()
  251. ctx = context.WithValue(ctx, generateContextKey("context"), latest.Context)
  252. cmd.SetContext(ctx)
  253. }
  254. return nil
  255. }
  256. func showLayer(l *server.Layer) {
  257. filename, err := server.GetBlobsPath(l.Digest)
  258. bts, err := os.ReadFile(filename)
  259. if err != nil {
  260. fmt.Printf("Couldn't read layer")
  261. return
  262. }
  263. fmt.Printf(string(bts) + "\n")
  264. }
  265. func generateInteractive(cmd *cobra.Command, model string) error {
  266. home, err := os.UserHomeDir()
  267. if err != nil {
  268. return err
  269. }
  270. completer := readline.NewPrefixCompleter(
  271. readline.PcItem("/help"),
  272. readline.PcItem("/list"),
  273. readline.PcItem("/set",
  274. readline.PcItem("history"),
  275. readline.PcItem("nohistory"),
  276. readline.PcItem("verbose"),
  277. readline.PcItem("quiet"),
  278. readline.PcItem("mode",
  279. readline.PcItem("vim"),
  280. readline.PcItem("emacs"),
  281. readline.PcItem("default"),
  282. ),
  283. ),
  284. readline.PcItem("/show",
  285. readline.PcItem("license"),
  286. readline.PcItem("system"),
  287. readline.PcItem("template"),
  288. ),
  289. readline.PcItem("/exit"),
  290. readline.PcItem("/bye"),
  291. )
  292. usage := func() {
  293. fmt.Fprintln(os.Stderr, "commands:")
  294. fmt.Fprintln(os.Stderr, completer.Tree(" "))
  295. }
  296. config := readline.Config{
  297. Prompt: ">>> ",
  298. HistoryFile: filepath.Join(home, ".ollama", "history"),
  299. AutoComplete: completer,
  300. }
  301. scanner, err := readline.NewEx(&config)
  302. if err != nil {
  303. return err
  304. }
  305. defer scanner.Close()
  306. var multiLineBuffer string
  307. var isMultiLine bool
  308. for {
  309. line, err := scanner.Readline()
  310. switch {
  311. case errors.Is(err, io.EOF):
  312. return nil
  313. case errors.Is(err, readline.ErrInterrupt):
  314. if line == "" {
  315. return nil
  316. }
  317. continue
  318. case err != nil:
  319. return err
  320. }
  321. line = strings.TrimSpace(line)
  322. switch {
  323. case isMultiLine:
  324. if strings.HasSuffix(line, `"""`) {
  325. isMultiLine = false
  326. multiLineBuffer += strings.TrimSuffix(line, `"""`)
  327. line = multiLineBuffer
  328. multiLineBuffer = ""
  329. scanner.SetPrompt(">>> ")
  330. } else {
  331. multiLineBuffer += line + " "
  332. continue
  333. }
  334. case strings.HasPrefix(line, `"""`):
  335. isMultiLine = true
  336. multiLineBuffer = strings.TrimPrefix(line, `"""`) + " "
  337. scanner.SetPrompt("... ")
  338. continue
  339. case strings.HasPrefix(line, "/list"):
  340. args := strings.Fields(line)
  341. if err := ListHandler(cmd, args[1:]); err != nil {
  342. return err
  343. }
  344. continue
  345. case strings.HasPrefix(line, "/set"):
  346. args := strings.Fields(line)
  347. if len(args) > 1 {
  348. switch args[1] {
  349. case "history":
  350. scanner.HistoryEnable()
  351. continue
  352. case "nohistory":
  353. scanner.HistoryDisable()
  354. continue
  355. case "verbose":
  356. cmd.Flags().Set("verbose", "true")
  357. continue
  358. case "quiet":
  359. cmd.Flags().Set("verbose", "false")
  360. continue
  361. case "mode":
  362. if len(args) > 2 {
  363. switch args[2] {
  364. case "vim":
  365. scanner.SetVimMode(true)
  366. continue
  367. case "emacs", "default":
  368. scanner.SetVimMode(false)
  369. continue
  370. default:
  371. usage()
  372. continue
  373. }
  374. } else {
  375. usage()
  376. continue
  377. }
  378. }
  379. } else {
  380. usage()
  381. continue
  382. }
  383. case strings.HasPrefix(line, "/show"):
  384. args := strings.Fields(line)
  385. if len(args) > 1 {
  386. mp := server.ParseModelPath(model)
  387. manifest, err := server.GetManifest(mp)
  388. if err != nil {
  389. fmt.Printf("error: couldn't get a manifestfor this model")
  390. continue
  391. }
  392. switch args[1] {
  393. case "license":
  394. for _, l := range manifest.Layers {
  395. if l.MediaType == "application/vnd.ollama.image.license" {
  396. showLayer(l)
  397. }
  398. }
  399. continue
  400. case "system":
  401. for _, l := range manifest.Layers {
  402. if l.MediaType == "application/vnd.ollama.image.system" {
  403. showLayer(l)
  404. }
  405. }
  406. continue
  407. case "template":
  408. for _, l := range manifest.Layers {
  409. if l.MediaType == "application/vnd.ollama.image.template" {
  410. showLayer(l)
  411. }
  412. }
  413. continue
  414. default:
  415. usage()
  416. continue
  417. }
  418. } else {
  419. usage()
  420. continue
  421. }
  422. case line == "/help", line == "/?":
  423. usage()
  424. continue
  425. case line == "/exit", line == "/bye":
  426. return nil
  427. }
  428. if err := generate(cmd, model, line); err != nil {
  429. return err
  430. }
  431. }
  432. }
  433. func generateBatch(cmd *cobra.Command, model string) error {
  434. scanner := bufio.NewScanner(os.Stdin)
  435. for scanner.Scan() {
  436. prompt := scanner.Text()
  437. fmt.Printf(">>> %s\n", prompt)
  438. if err := generate(cmd, model, prompt); err != nil {
  439. return err
  440. }
  441. }
  442. return nil
  443. }
  444. // getRunServerParams takes a command and the environment variables and returns the correct params
  445. // given the order of precedence: command line args (highest), environment variables, defaults (lowest)
  446. func getRunServerParams(cmd *cobra.Command) (host, port string, extraOrigins []string, err error) {
  447. host = os.Getenv("OLLAMA_HOST")
  448. hostFlag := cmd.Flags().Lookup("host")
  449. if hostFlag == nil {
  450. return "", "", nil, errors.New("host unset")
  451. }
  452. if hostFlag.Changed || host == "" {
  453. host = hostFlag.Value.String()
  454. }
  455. port = os.Getenv("OLLAMA_PORT")
  456. portFlag := cmd.Flags().Lookup("port")
  457. if portFlag == nil {
  458. return "", "", nil, errors.New("port unset")
  459. }
  460. if portFlag.Changed || port == "" {
  461. port = portFlag.Value.String()
  462. }
  463. extraOrigins, err = cmd.Flags().GetStringSlice("allowed-origins")
  464. if err != nil {
  465. return "", "", nil, err
  466. }
  467. return host, port, extraOrigins, nil
  468. }
  469. func RunServer(cmd *cobra.Command, _ []string) error {
  470. host, port, extraOrigins, err := getRunServerParams(cmd)
  471. if err != nil {
  472. return err
  473. }
  474. ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
  475. if err != nil {
  476. return err
  477. }
  478. return server.Serve(ln, extraOrigins)
  479. }
  480. func startMacApp(client *api.Client) error {
  481. exe, err := os.Executable()
  482. if err != nil {
  483. return err
  484. }
  485. link, err := os.Readlink(exe)
  486. if err != nil {
  487. return err
  488. }
  489. if !strings.Contains(link, "Ollama.app") {
  490. return fmt.Errorf("could not find ollama app")
  491. }
  492. path := strings.Split(link, "Ollama.app")
  493. if err := exec.Command("/usr/bin/open", "-a", path[0]+"Ollama.app").Run(); err != nil {
  494. return err
  495. }
  496. // wait for the server to start
  497. timeout := time.After(5 * time.Second)
  498. tick := time.Tick(500 * time.Millisecond)
  499. for {
  500. select {
  501. case <-timeout:
  502. return errors.New("timed out waiting for server to start")
  503. case <-tick:
  504. if err := client.Heartbeat(context.Background()); err == nil {
  505. return nil // server has started
  506. }
  507. }
  508. }
  509. }
  510. func checkServerHeartbeat(_ *cobra.Command, _ []string) error {
  511. client := api.NewClient()
  512. if err := client.Heartbeat(context.Background()); err != nil {
  513. if !strings.Contains(err.Error(), "connection refused") {
  514. return err
  515. }
  516. if runtime.GOOS == "darwin" {
  517. if err := startMacApp(client); err != nil {
  518. return fmt.Errorf("could not connect to ollama app, is it running?")
  519. }
  520. } else {
  521. return fmt.Errorf("could not connect to ollama server, run 'ollama serve' to start it")
  522. }
  523. }
  524. return nil
  525. }
  526. func NewCLI() *cobra.Command {
  527. log.SetFlags(log.LstdFlags | log.Lshortfile)
  528. rootCmd := &cobra.Command{
  529. Use: "ollama",
  530. Short: "Large language model runner",
  531. SilenceUsage: true,
  532. CompletionOptions: cobra.CompletionOptions{
  533. DisableDefaultCmd: true,
  534. },
  535. }
  536. cobra.EnableCommandSorting = false
  537. createCmd := &cobra.Command{
  538. Use: "create MODEL",
  539. Short: "Create a model from a Modelfile",
  540. Args: cobra.MinimumNArgs(1),
  541. PreRunE: checkServerHeartbeat,
  542. RunE: CreateHandler,
  543. }
  544. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  545. runCmd := &cobra.Command{
  546. Use: "run MODEL [PROMPT]",
  547. Short: "Run a model",
  548. Args: cobra.MinimumNArgs(1),
  549. PreRunE: checkServerHeartbeat,
  550. RunE: RunHandler,
  551. }
  552. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  553. serveCmd := &cobra.Command{
  554. Use: "serve",
  555. Aliases: []string{"start"},
  556. Short: "Start ollama",
  557. RunE: RunServer,
  558. }
  559. serveCmd.Flags().String("port", "11434", "Port to listen on, may also use OLLAMA_PORT environment variable")
  560. serveCmd.Flags().String("host", "127.0.0.1", "Host listen address, may also use OLLAMA_HOST environment variable")
  561. serveCmd.Flags().StringSlice("allowed-origins", []string{}, "Additional allowed CORS origins (outside of localhost), specify as comma-separated list")
  562. pullCmd := &cobra.Command{
  563. Use: "pull MODEL",
  564. Short: "Pull a model from a registry",
  565. Args: cobra.MinimumNArgs(1),
  566. PreRunE: checkServerHeartbeat,
  567. RunE: PullHandler,
  568. }
  569. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  570. pushCmd := &cobra.Command{
  571. Use: "push MODEL",
  572. Short: "Push a model to a registry",
  573. Args: cobra.MinimumNArgs(1),
  574. PreRunE: checkServerHeartbeat,
  575. RunE: PushHandler,
  576. }
  577. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  578. listCmd := &cobra.Command{
  579. Use: "list",
  580. Aliases: []string{"ls"},
  581. Short: "List models",
  582. PreRunE: checkServerHeartbeat,
  583. RunE: ListHandler,
  584. }
  585. copyCmd := &cobra.Command{
  586. Use: "cp",
  587. Short: "Copy a model",
  588. Args: cobra.MinimumNArgs(2),
  589. PreRunE: checkServerHeartbeat,
  590. RunE: CopyHandler,
  591. }
  592. deleteCmd := &cobra.Command{
  593. Use: "rm",
  594. Short: "Remove a model",
  595. Args: cobra.MinimumNArgs(1),
  596. PreRunE: checkServerHeartbeat,
  597. RunE: DeleteHandler,
  598. }
  599. rootCmd.AddCommand(
  600. serveCmd,
  601. createCmd,
  602. runCmd,
  603. pullCmd,
  604. pushCmd,
  605. listCmd,
  606. copyCmd,
  607. deleteCmd,
  608. )
  609. return rootCmd
  610. }