cmd.go 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780
  1. package cmd
  2. import (
  3. "bufio"
  4. "context"
  5. "crypto/ed25519"
  6. "crypto/rand"
  7. "encoding/pem"
  8. "errors"
  9. "fmt"
  10. "io"
  11. "log"
  12. "net"
  13. "net/http"
  14. "os"
  15. "os/exec"
  16. "path"
  17. "path/filepath"
  18. "runtime"
  19. "strings"
  20. "time"
  21. "github.com/chzyer/readline"
  22. "github.com/dustin/go-humanize"
  23. "github.com/olekukonko/tablewriter"
  24. "github.com/spf13/cobra"
  25. "golang.org/x/crypto/ssh"
  26. "github.com/jmorganca/ollama/api"
  27. "github.com/jmorganca/ollama/format"
  28. "github.com/jmorganca/ollama/progressbar"
  29. "github.com/jmorganca/ollama/server"
  30. )
  31. func CreateHandler(cmd *cobra.Command, args []string) error {
  32. filename, _ := cmd.Flags().GetString("file")
  33. filename, err := filepath.Abs(filename)
  34. if err != nil {
  35. return err
  36. }
  37. client := api.NewClient()
  38. var spinner *Spinner
  39. var currentDigest string
  40. var bar *progressbar.ProgressBar
  41. request := api.CreateRequest{Name: args[0], Path: filename}
  42. fn := func(resp api.ProgressResponse) error {
  43. if resp.Digest != currentDigest && resp.Digest != "" {
  44. if spinner != nil {
  45. spinner.Stop()
  46. }
  47. currentDigest = resp.Digest
  48. switch {
  49. case strings.Contains(resp.Status, "embeddings"):
  50. bar = progressbar.Default(int64(resp.Total), resp.Status)
  51. bar.Set(resp.Completed)
  52. default:
  53. // pulling
  54. bar = progressbar.DefaultBytes(
  55. int64(resp.Total),
  56. resp.Status,
  57. )
  58. bar.Set(resp.Completed)
  59. }
  60. } else if resp.Digest == currentDigest && resp.Digest != "" {
  61. bar.Set(resp.Completed)
  62. } else {
  63. currentDigest = ""
  64. if spinner != nil {
  65. spinner.Stop()
  66. }
  67. spinner = NewSpinner(resp.Status)
  68. go spinner.Spin(100 * time.Millisecond)
  69. }
  70. return nil
  71. }
  72. if err := client.Create(context.Background(), &request, fn); err != nil {
  73. return err
  74. }
  75. if spinner != nil {
  76. spinner.Stop()
  77. if spinner.description != "success" {
  78. return errors.New("unexpected end to create model")
  79. }
  80. }
  81. return nil
  82. }
  83. func RunHandler(cmd *cobra.Command, args []string) error {
  84. mp := server.ParseModelPath(args[0])
  85. fp, err := mp.GetManifestPath(false)
  86. if err != nil {
  87. return err
  88. }
  89. _, err = os.Stat(fp)
  90. switch {
  91. case errors.Is(err, os.ErrNotExist):
  92. if err := pull(args[0], false); err != nil {
  93. var apiStatusError api.StatusError
  94. if !errors.As(err, &apiStatusError) {
  95. return err
  96. }
  97. if apiStatusError.StatusCode != http.StatusBadGateway {
  98. return err
  99. }
  100. }
  101. case err != nil:
  102. return err
  103. }
  104. return RunGenerate(cmd, args)
  105. }
  106. func PushHandler(cmd *cobra.Command, args []string) error {
  107. client := api.NewClient()
  108. insecure, err := cmd.Flags().GetBool("insecure")
  109. if err != nil {
  110. return err
  111. }
  112. var currentDigest string
  113. var bar *progressbar.ProgressBar
  114. request := api.PushRequest{Name: args[0], Insecure: insecure}
  115. fn := func(resp api.ProgressResponse) error {
  116. if resp.Digest != currentDigest && resp.Digest != "" {
  117. currentDigest = resp.Digest
  118. bar = progressbar.DefaultBytes(
  119. int64(resp.Total),
  120. fmt.Sprintf("pushing %s...", resp.Digest[7:19]),
  121. )
  122. bar.Set(resp.Completed)
  123. } else if resp.Digest == currentDigest && resp.Digest != "" {
  124. bar.Set(resp.Completed)
  125. } else {
  126. currentDigest = ""
  127. fmt.Println(resp.Status)
  128. }
  129. return nil
  130. }
  131. if err := client.Push(context.Background(), &request, fn); err != nil {
  132. return err
  133. }
  134. if bar != nil && !bar.IsFinished() {
  135. return errors.New("unexpected end to push model")
  136. }
  137. return nil
  138. }
  139. func ListHandler(cmd *cobra.Command, args []string) error {
  140. client := api.NewClient()
  141. models, err := client.List(context.Background())
  142. if err != nil {
  143. return err
  144. }
  145. var data [][]string
  146. for _, m := range models.Models {
  147. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  148. data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
  149. }
  150. }
  151. table := tablewriter.NewWriter(os.Stdout)
  152. table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
  153. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  154. table.SetAlignment(tablewriter.ALIGN_LEFT)
  155. table.SetHeaderLine(false)
  156. table.SetBorder(false)
  157. table.SetNoWhiteSpace(true)
  158. table.SetTablePadding("\t")
  159. table.AppendBulk(data)
  160. table.Render()
  161. return nil
  162. }
  163. func DeleteHandler(cmd *cobra.Command, args []string) error {
  164. client := api.NewClient()
  165. req := api.DeleteRequest{Name: args[0]}
  166. if err := client.Delete(context.Background(), &req); err != nil {
  167. return err
  168. }
  169. fmt.Printf("deleted '%s'\n", args[0])
  170. return nil
  171. }
  172. func CopyHandler(cmd *cobra.Command, args []string) error {
  173. client := api.NewClient()
  174. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  175. if err := client.Copy(context.Background(), &req); err != nil {
  176. return err
  177. }
  178. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  179. return nil
  180. }
  181. func PullHandler(cmd *cobra.Command, args []string) error {
  182. insecure, err := cmd.Flags().GetBool("insecure")
  183. if err != nil {
  184. return err
  185. }
  186. return pull(args[0], insecure)
  187. }
  188. func pull(model string, insecure bool) error {
  189. client := api.NewClient()
  190. var currentDigest string
  191. var bar *progressbar.ProgressBar
  192. request := api.PullRequest{Name: model, Insecure: insecure}
  193. fn := func(resp api.ProgressResponse) error {
  194. if resp.Digest != currentDigest && resp.Digest != "" {
  195. currentDigest = resp.Digest
  196. bar = progressbar.DefaultBytes(
  197. int64(resp.Total),
  198. fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
  199. )
  200. bar.Set(resp.Completed)
  201. } else if resp.Digest == currentDigest && resp.Digest != "" {
  202. bar.Set(resp.Completed)
  203. } else {
  204. currentDigest = ""
  205. fmt.Println(resp.Status)
  206. }
  207. return nil
  208. }
  209. if err := client.Pull(context.Background(), &request, fn); err != nil {
  210. return err
  211. }
  212. if bar != nil && !bar.IsFinished() {
  213. return errors.New("unexpected end to pull model")
  214. }
  215. return nil
  216. }
  217. func RunGenerate(cmd *cobra.Command, args []string) error {
  218. if len(args) > 1 {
  219. // join all args into a single prompt
  220. return generate(cmd, args[0], strings.Join(args[1:], " "))
  221. }
  222. if readline.IsTerminal(int(os.Stdin.Fd())) {
  223. return generateInteractive(cmd, args[0])
  224. }
  225. return generateBatch(cmd, args[0])
  226. }
  227. type generateContextKey string
  228. func generate(cmd *cobra.Command, model, prompt string) error {
  229. if len(strings.TrimSpace(prompt)) > 0 {
  230. client := api.NewClient()
  231. spinner := NewSpinner("")
  232. go spinner.Spin(60 * time.Millisecond)
  233. var latest api.GenerateResponse
  234. generateContext, ok := cmd.Context().Value(generateContextKey("context")).([]int)
  235. if !ok {
  236. generateContext = []int{}
  237. }
  238. request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
  239. fn := func(response api.GenerateResponse) error {
  240. if !spinner.IsFinished() {
  241. spinner.Finish()
  242. }
  243. latest = response
  244. fmt.Print(response.Response)
  245. return nil
  246. }
  247. if err := client.Generate(context.Background(), &request, fn); err != nil {
  248. if strings.Contains(err.Error(), "failed to load model") {
  249. // tell the user to check the server log, if it exists locally
  250. home, nestedErr := os.UserHomeDir()
  251. if nestedErr != nil {
  252. // return the original error
  253. return err
  254. }
  255. logPath := filepath.Join(home, ".ollama", "logs", "server.log")
  256. if _, nestedErr := os.Stat(logPath); nestedErr == nil {
  257. err = fmt.Errorf("%w\nFor more details, check the error logs at %s", err, logPath)
  258. }
  259. }
  260. return err
  261. }
  262. fmt.Println()
  263. fmt.Println()
  264. if !latest.Done {
  265. return errors.New("unexpected end of response")
  266. }
  267. verbose, err := cmd.Flags().GetBool("verbose")
  268. if err != nil {
  269. return err
  270. }
  271. if verbose {
  272. latest.Summary()
  273. }
  274. ctx := cmd.Context()
  275. ctx = context.WithValue(ctx, generateContextKey("context"), latest.Context)
  276. cmd.SetContext(ctx)
  277. }
  278. return nil
  279. }
  280. func showLayer(l *server.Layer) {
  281. filename, err := server.GetBlobsPath(l.Digest)
  282. if err != nil {
  283. fmt.Println("Couldn't get layer's path")
  284. return
  285. }
  286. bts, err := os.ReadFile(filename)
  287. if err != nil {
  288. fmt.Println("Couldn't read layer")
  289. return
  290. }
  291. fmt.Println(string(bts))
  292. }
  293. func generateInteractive(cmd *cobra.Command, model string) error {
  294. home, err := os.UserHomeDir()
  295. if err != nil {
  296. return err
  297. }
  298. completer := readline.NewPrefixCompleter(
  299. readline.PcItem("/help"),
  300. readline.PcItem("/list"),
  301. readline.PcItem("/set",
  302. readline.PcItem("history"),
  303. readline.PcItem("nohistory"),
  304. readline.PcItem("verbose"),
  305. readline.PcItem("quiet"),
  306. readline.PcItem("mode",
  307. readline.PcItem("vim"),
  308. readline.PcItem("emacs"),
  309. readline.PcItem("default"),
  310. ),
  311. ),
  312. readline.PcItem("/show",
  313. readline.PcItem("license"),
  314. readline.PcItem("system"),
  315. readline.PcItem("template"),
  316. ),
  317. readline.PcItem("/exit"),
  318. readline.PcItem("/bye"),
  319. )
  320. usage := func() {
  321. fmt.Fprintln(os.Stderr, "commands:")
  322. fmt.Fprintln(os.Stderr, completer.Tree(" "))
  323. }
  324. config := readline.Config{
  325. Prompt: ">>> ",
  326. HistoryFile: filepath.Join(home, ".ollama", "history"),
  327. AutoComplete: completer,
  328. }
  329. scanner, err := readline.NewEx(&config)
  330. if err != nil {
  331. return err
  332. }
  333. defer scanner.Close()
  334. var multiLineBuffer string
  335. var isMultiLine bool
  336. for {
  337. line, err := scanner.Readline()
  338. switch {
  339. case errors.Is(err, io.EOF):
  340. return nil
  341. case errors.Is(err, readline.ErrInterrupt):
  342. if line == "" {
  343. return nil
  344. }
  345. continue
  346. case err != nil:
  347. return err
  348. }
  349. line = strings.TrimSpace(line)
  350. switch {
  351. case isMultiLine:
  352. if strings.HasSuffix(line, `"""`) {
  353. isMultiLine = false
  354. multiLineBuffer += strings.TrimSuffix(line, `"""`)
  355. line = multiLineBuffer
  356. multiLineBuffer = ""
  357. scanner.SetPrompt(">>> ")
  358. } else {
  359. multiLineBuffer += line + " "
  360. continue
  361. }
  362. case strings.HasPrefix(line, `"""`):
  363. isMultiLine = true
  364. multiLineBuffer = strings.TrimPrefix(line, `"""`) + " "
  365. scanner.SetPrompt("... ")
  366. continue
  367. case strings.HasPrefix(line, "/list"):
  368. args := strings.Fields(line)
  369. if err := ListHandler(cmd, args[1:]); err != nil {
  370. return err
  371. }
  372. continue
  373. case strings.HasPrefix(line, "/set"):
  374. args := strings.Fields(line)
  375. if len(args) > 1 {
  376. switch args[1] {
  377. case "history":
  378. scanner.HistoryEnable()
  379. continue
  380. case "nohistory":
  381. scanner.HistoryDisable()
  382. continue
  383. case "verbose":
  384. cmd.Flags().Set("verbose", "true")
  385. continue
  386. case "quiet":
  387. cmd.Flags().Set("verbose", "false")
  388. continue
  389. case "mode":
  390. if len(args) > 2 {
  391. switch args[2] {
  392. case "vim":
  393. scanner.SetVimMode(true)
  394. continue
  395. case "emacs", "default":
  396. scanner.SetVimMode(false)
  397. continue
  398. default:
  399. usage()
  400. continue
  401. }
  402. } else {
  403. usage()
  404. continue
  405. }
  406. }
  407. } else {
  408. usage()
  409. continue
  410. }
  411. case strings.HasPrefix(line, "/show"):
  412. args := strings.Fields(line)
  413. if len(args) > 1 {
  414. mp := server.ParseModelPath(model)
  415. manifest, err := server.GetManifest(mp)
  416. if err != nil {
  417. fmt.Println("error: couldn't get a manifest for this model")
  418. continue
  419. }
  420. switch args[1] {
  421. case "license":
  422. for _, l := range manifest.Layers {
  423. if l.MediaType == "application/vnd.ollama.image.license" {
  424. showLayer(l)
  425. }
  426. }
  427. continue
  428. case "system":
  429. for _, l := range manifest.Layers {
  430. if l.MediaType == "application/vnd.ollama.image.system" {
  431. showLayer(l)
  432. }
  433. }
  434. continue
  435. case "template":
  436. for _, l := range manifest.Layers {
  437. if l.MediaType == "application/vnd.ollama.image.template" {
  438. showLayer(l)
  439. }
  440. }
  441. continue
  442. default:
  443. usage()
  444. continue
  445. }
  446. } else {
  447. usage()
  448. continue
  449. }
  450. case line == "/help", line == "/?":
  451. usage()
  452. continue
  453. case line == "/exit", line == "/bye":
  454. return nil
  455. }
  456. if err := generate(cmd, model, line); err != nil {
  457. return err
  458. }
  459. }
  460. }
  461. func generateBatch(cmd *cobra.Command, model string) error {
  462. scanner := bufio.NewScanner(os.Stdin)
  463. for scanner.Scan() {
  464. prompt := scanner.Text()
  465. fmt.Printf(">>> %s\n", prompt)
  466. if err := generate(cmd, model, prompt); err != nil {
  467. return err
  468. }
  469. }
  470. return nil
  471. }
  472. func RunServer(cmd *cobra.Command, _ []string) error {
  473. var host, port = "127.0.0.1", "11434"
  474. parts := strings.Split(os.Getenv("OLLAMA_HOST"), ":")
  475. if ip := net.ParseIP(parts[0]); ip != nil {
  476. host = ip.String()
  477. }
  478. if len(parts) > 1 {
  479. port = parts[1]
  480. }
  481. // deprecated: include port in OLLAMA_HOST
  482. if p := os.Getenv("OLLAMA_PORT"); p != "" {
  483. port = p
  484. }
  485. err := initializeKeypair()
  486. if err != nil {
  487. return err
  488. }
  489. ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
  490. if err != nil {
  491. return err
  492. }
  493. var origins []string
  494. if o := os.Getenv("OLLAMA_ORIGINS"); o != "" {
  495. origins = strings.Split(o, ",")
  496. }
  497. return server.Serve(ln, origins)
  498. }
  499. func initializeKeypair() error {
  500. home, err := os.UserHomeDir()
  501. if err != nil {
  502. return err
  503. }
  504. privKeyPath := filepath.Join(home, ".ollama", "id_ed25519")
  505. pubKeyPath := filepath.Join(home, ".ollama", "id_ed25519.pub")
  506. _, err = os.Stat(privKeyPath)
  507. if os.IsNotExist(err) {
  508. fmt.Printf("Couldn't find '%s'. Generating new private key.\n", privKeyPath)
  509. _, privKey, err := ed25519.GenerateKey(rand.Reader)
  510. if err != nil {
  511. return err
  512. }
  513. privKeyBytes, err := format.OpenSSHPrivateKey(privKey, "")
  514. if err != nil {
  515. return err
  516. }
  517. err = os.MkdirAll(path.Dir(privKeyPath), 0o700)
  518. if err != nil {
  519. return fmt.Errorf("could not create directory %w", err)
  520. }
  521. err = os.WriteFile(privKeyPath, pem.EncodeToMemory(privKeyBytes), 0600)
  522. if err != nil {
  523. return err
  524. }
  525. sshPrivateKey, err := ssh.NewSignerFromKey(privKey)
  526. if err != nil {
  527. return err
  528. }
  529. pubKeyData := ssh.MarshalAuthorizedKey(sshPrivateKey.PublicKey())
  530. err = os.WriteFile(pubKeyPath, pubKeyData, 0644)
  531. if err != nil {
  532. return err
  533. }
  534. fmt.Printf("Your new public key is: \n\n%s\n", string(pubKeyData))
  535. }
  536. return nil
  537. }
  538. func startMacApp(client *api.Client) error {
  539. exe, err := os.Executable()
  540. if err != nil {
  541. return err
  542. }
  543. link, err := os.Readlink(exe)
  544. if err != nil {
  545. return err
  546. }
  547. if !strings.Contains(link, "Ollama.app") {
  548. return fmt.Errorf("could not find ollama app")
  549. }
  550. path := strings.Split(link, "Ollama.app")
  551. if err := exec.Command("/usr/bin/open", "-a", path[0]+"Ollama.app").Run(); err != nil {
  552. return err
  553. }
  554. // wait for the server to start
  555. timeout := time.After(5 * time.Second)
  556. tick := time.Tick(500 * time.Millisecond)
  557. for {
  558. select {
  559. case <-timeout:
  560. return errors.New("timed out waiting for server to start")
  561. case <-tick:
  562. if err := client.Heartbeat(context.Background()); err == nil {
  563. return nil // server has started
  564. }
  565. }
  566. }
  567. }
  568. func checkServerHeartbeat(_ *cobra.Command, _ []string) error {
  569. client := api.NewClient()
  570. if err := client.Heartbeat(context.Background()); err != nil {
  571. if !strings.Contains(err.Error(), "connection refused") {
  572. return err
  573. }
  574. if runtime.GOOS == "darwin" {
  575. if err := startMacApp(client); err != nil {
  576. return fmt.Errorf("could not connect to ollama app, is it running?")
  577. }
  578. } else {
  579. return fmt.Errorf("could not connect to ollama server, run 'ollama serve' to start it")
  580. }
  581. }
  582. return nil
  583. }
  584. func NewCLI() *cobra.Command {
  585. log.SetFlags(log.LstdFlags | log.Lshortfile)
  586. rootCmd := &cobra.Command{
  587. Use: "ollama",
  588. Short: "Large language model runner",
  589. SilenceUsage: true,
  590. SilenceErrors: true,
  591. CompletionOptions: cobra.CompletionOptions{
  592. DisableDefaultCmd: true,
  593. },
  594. }
  595. cobra.EnableCommandSorting = false
  596. createCmd := &cobra.Command{
  597. Use: "create MODEL",
  598. Short: "Create a model from a Modelfile",
  599. Args: cobra.MinimumNArgs(1),
  600. PreRunE: checkServerHeartbeat,
  601. RunE: CreateHandler,
  602. }
  603. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  604. runCmd := &cobra.Command{
  605. Use: "run MODEL [PROMPT]",
  606. Short: "Run a model",
  607. Args: cobra.MinimumNArgs(1),
  608. PreRunE: checkServerHeartbeat,
  609. RunE: RunHandler,
  610. }
  611. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  612. serveCmd := &cobra.Command{
  613. Use: "serve",
  614. Aliases: []string{"start"},
  615. Short: "Start ollama",
  616. RunE: RunServer,
  617. }
  618. pullCmd := &cobra.Command{
  619. Use: "pull MODEL",
  620. Short: "Pull a model from a registry",
  621. Args: cobra.MinimumNArgs(1),
  622. PreRunE: checkServerHeartbeat,
  623. RunE: PullHandler,
  624. }
  625. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  626. pushCmd := &cobra.Command{
  627. Use: "push MODEL",
  628. Short: "Push a model to a registry",
  629. Args: cobra.MinimumNArgs(1),
  630. PreRunE: checkServerHeartbeat,
  631. RunE: PushHandler,
  632. }
  633. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  634. listCmd := &cobra.Command{
  635. Use: "list",
  636. Aliases: []string{"ls"},
  637. Short: "List models",
  638. PreRunE: checkServerHeartbeat,
  639. RunE: ListHandler,
  640. }
  641. copyCmd := &cobra.Command{
  642. Use: "cp",
  643. Short: "Copy a model",
  644. Args: cobra.MinimumNArgs(2),
  645. PreRunE: checkServerHeartbeat,
  646. RunE: CopyHandler,
  647. }
  648. deleteCmd := &cobra.Command{
  649. Use: "rm",
  650. Short: "Remove a model",
  651. Args: cobra.MinimumNArgs(1),
  652. PreRunE: checkServerHeartbeat,
  653. RunE: DeleteHandler,
  654. }
  655. rootCmd.AddCommand(
  656. serveCmd,
  657. createCmd,
  658. runCmd,
  659. pullCmd,
  660. pushCmd,
  661. listCmd,
  662. copyCmd,
  663. deleteCmd,
  664. )
  665. return rootCmd
  666. }