cmd.go 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536
  1. package cmd
  2. import (
  3. "bufio"
  4. "context"
  5. "errors"
  6. "fmt"
  7. "io"
  8. "log"
  9. "net"
  10. "net/http"
  11. "os"
  12. "path/filepath"
  13. "strings"
  14. "time"
  15. "github.com/chzyer/readline"
  16. "github.com/dustin/go-humanize"
  17. "github.com/olekukonko/tablewriter"
  18. "github.com/spf13/cobra"
  19. "github.com/jmorganca/ollama/api"
  20. "github.com/jmorganca/ollama/format"
  21. "github.com/jmorganca/ollama/parser"
  22. "github.com/jmorganca/ollama/progressbar"
  23. "github.com/jmorganca/ollama/server"
  24. )
  25. func CreateHandler(cmd *cobra.Command, args []string) error {
  26. filename, _ := cmd.Flags().GetString("file")
  27. filename, err := filepath.Abs(filename)
  28. if err != nil {
  29. return err
  30. }
  31. client := api.NewClient()
  32. var spinner *Spinner
  33. // pull the model file if needed
  34. mf, err := os.Open(filename)
  35. defer mf.Close()
  36. cmds, err := parser.Parse(mf)
  37. if err != nil {
  38. return err
  39. }
  40. mf.Close()
  41. for _, c := range cmds {
  42. if c.Name == "model" {
  43. // check if the model file needs to be pulled
  44. checkPull(c.Args)
  45. }
  46. }
  47. if err != nil {
  48. return err
  49. }
  50. request := api.CreateRequest{Name: args[0], Path: filename}
  51. fn := func(resp api.CreateProgress) error {
  52. if spinner != nil {
  53. spinner.Stop()
  54. }
  55. spinner = NewSpinner(resp.Status)
  56. go spinner.Spin(100 * time.Millisecond)
  57. return nil
  58. }
  59. if err := client.Create(context.Background(), &request, fn); err != nil {
  60. return err
  61. }
  62. if spinner != nil {
  63. spinner.Stop()
  64. }
  65. return nil
  66. }
  67. func checkPull(model string) error {
  68. mp := server.ParseModelPath(model)
  69. fp, err := mp.GetManifestPath(false)
  70. if err != nil {
  71. return err
  72. }
  73. _, err = os.Stat(fp)
  74. switch {
  75. case errors.Is(err, os.ErrNotExist):
  76. if err := pull(model, false); err != nil {
  77. var apiStatusError api.StatusError
  78. if !errors.As(err, &apiStatusError) {
  79. return err
  80. }
  81. if apiStatusError.StatusCode != http.StatusBadGateway {
  82. return err
  83. }
  84. }
  85. case err != nil:
  86. return err
  87. }
  88. return nil
  89. }
  90. func RunHandler(cmd *cobra.Command, args []string) error {
  91. if err := checkPull(args[0]); err != nil {
  92. return err
  93. }
  94. return RunGenerate(cmd, args)
  95. }
  96. func PushHandler(cmd *cobra.Command, args []string) error {
  97. client := api.NewClient()
  98. insecure, err := cmd.Flags().GetBool("insecure")
  99. if err != nil {
  100. return err
  101. }
  102. var currentDigest string
  103. var bar *progressbar.ProgressBar
  104. request := api.PushRequest{Name: args[0], Insecure: insecure}
  105. fn := func(resp api.ProgressResponse) error {
  106. if resp.Digest != currentDigest && resp.Digest != "" {
  107. currentDigest = resp.Digest
  108. bar = progressbar.DefaultBytes(
  109. int64(resp.Total),
  110. fmt.Sprintf("pushing %s...", resp.Digest[7:19]),
  111. )
  112. bar.Set(resp.Completed)
  113. } else if resp.Digest == currentDigest && resp.Digest != "" {
  114. bar.Set(resp.Completed)
  115. } else {
  116. currentDigest = ""
  117. fmt.Println(resp.Status)
  118. }
  119. return nil
  120. }
  121. if err := client.Push(context.Background(), &request, fn); err != nil {
  122. return err
  123. }
  124. return nil
  125. }
  126. func ListHandler(cmd *cobra.Command, args []string) error {
  127. client := api.NewClient()
  128. models, err := client.List(context.Background())
  129. if err != nil {
  130. return err
  131. }
  132. var data [][]string
  133. for _, m := range models.Models {
  134. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  135. data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
  136. }
  137. }
  138. table := tablewriter.NewWriter(os.Stdout)
  139. table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
  140. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  141. table.SetAlignment(tablewriter.ALIGN_LEFT)
  142. table.SetHeaderLine(false)
  143. table.SetBorder(false)
  144. table.SetNoWhiteSpace(true)
  145. table.SetTablePadding("\t")
  146. table.AppendBulk(data)
  147. table.Render()
  148. return nil
  149. }
  150. func DeleteHandler(cmd *cobra.Command, args []string) error {
  151. client := api.NewClient()
  152. req := api.DeleteRequest{Name: args[0]}
  153. if err := client.Delete(context.Background(), &req); err != nil {
  154. return err
  155. }
  156. fmt.Printf("deleted '%s'\n", args[0])
  157. return nil
  158. }
  159. func CopyHandler(cmd *cobra.Command, args []string) error {
  160. client := api.NewClient()
  161. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  162. if err := client.Copy(context.Background(), &req); err != nil {
  163. return err
  164. }
  165. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  166. return nil
  167. }
  168. func PullHandler(cmd *cobra.Command, args []string) error {
  169. insecure, err := cmd.Flags().GetBool("insecure")
  170. if err != nil {
  171. return err
  172. }
  173. return pull(args[0], insecure)
  174. }
  175. func pull(model string, insecure bool) error {
  176. client := api.NewClient()
  177. var currentDigest string
  178. var bar *progressbar.ProgressBar
  179. request := api.PullRequest{Name: model, Insecure: insecure}
  180. fn := func(resp api.ProgressResponse) error {
  181. if resp.Digest != currentDigest && resp.Digest != "" {
  182. currentDigest = resp.Digest
  183. bar = progressbar.DefaultBytes(
  184. int64(resp.Total),
  185. fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
  186. )
  187. bar.Set(resp.Completed)
  188. } else if resp.Digest == currentDigest && resp.Digest != "" {
  189. bar.Set(resp.Completed)
  190. } else {
  191. currentDigest = ""
  192. fmt.Println(resp.Status)
  193. }
  194. return nil
  195. }
  196. if err := client.Pull(context.Background(), &request, fn); err != nil {
  197. return err
  198. }
  199. return nil
  200. }
  201. func RunGenerate(cmd *cobra.Command, args []string) error {
  202. if len(args) > 1 {
  203. // join all args into a single prompt
  204. return generate(cmd, args[0], strings.Join(args[1:], " "))
  205. }
  206. if readline.IsTerminal(int(os.Stdin.Fd())) {
  207. return generateInteractive(cmd, args[0])
  208. }
  209. return generateBatch(cmd, args[0])
  210. }
  211. var generateContextKey struct{}
  212. func generate(cmd *cobra.Command, model, prompt string) error {
  213. if len(strings.TrimSpace(prompt)) > 0 {
  214. client := api.NewClient()
  215. spinner := NewSpinner("")
  216. go spinner.Spin(60 * time.Millisecond)
  217. var latest api.GenerateResponse
  218. generateContext, ok := cmd.Context().Value(generateContextKey).([]int)
  219. if !ok {
  220. generateContext = []int{}
  221. }
  222. request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
  223. fn := func(resp api.GenerateResponse) error {
  224. if !spinner.IsFinished() {
  225. spinner.Finish()
  226. }
  227. latest = resp
  228. fmt.Print(resp.Response)
  229. cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context))
  230. return nil
  231. }
  232. if err := client.Generate(context.Background(), &request, fn); err != nil {
  233. return err
  234. }
  235. fmt.Println()
  236. fmt.Println()
  237. verbose, err := cmd.Flags().GetBool("verbose")
  238. if err != nil {
  239. return err
  240. }
  241. if verbose {
  242. latest.Summary()
  243. }
  244. }
  245. return nil
  246. }
  247. func generateInteractive(cmd *cobra.Command, model string) error {
  248. home, err := os.UserHomeDir()
  249. if err != nil {
  250. return err
  251. }
  252. completer := readline.NewPrefixCompleter(
  253. readline.PcItem("/help"),
  254. readline.PcItem("/list"),
  255. readline.PcItem("/set",
  256. readline.PcItem("history"),
  257. readline.PcItem("nohistory"),
  258. readline.PcItem("verbose"),
  259. readline.PcItem("quiet"),
  260. readline.PcItem("mode",
  261. readline.PcItem("vim"),
  262. readline.PcItem("emacs"),
  263. readline.PcItem("default"),
  264. ),
  265. ),
  266. readline.PcItem("/exit"),
  267. readline.PcItem("/bye"),
  268. )
  269. usage := func() {
  270. fmt.Fprintln(os.Stderr, "commands:")
  271. fmt.Fprintln(os.Stderr, completer.Tree(" "))
  272. }
  273. config := readline.Config{
  274. Prompt: ">>> ",
  275. HistoryFile: filepath.Join(home, ".ollama", "history"),
  276. AutoComplete: completer,
  277. }
  278. scanner, err := readline.NewEx(&config)
  279. if err != nil {
  280. return err
  281. }
  282. defer scanner.Close()
  283. for {
  284. line, err := scanner.Readline()
  285. switch {
  286. case errors.Is(err, io.EOF):
  287. return nil
  288. case errors.Is(err, readline.ErrInterrupt):
  289. if line == "" {
  290. return nil
  291. }
  292. continue
  293. case err != nil:
  294. return err
  295. }
  296. line = strings.TrimSpace(line)
  297. switch {
  298. case strings.HasPrefix(line, "/list"):
  299. args := strings.Fields(line)
  300. if err := ListHandler(cmd, args[1:]); err != nil {
  301. return err
  302. }
  303. continue
  304. case strings.HasPrefix(line, "/set"):
  305. args := strings.Fields(line)
  306. if len(args) > 1 {
  307. switch args[1] {
  308. case "history":
  309. scanner.HistoryEnable()
  310. continue
  311. case "nohistory":
  312. scanner.HistoryDisable()
  313. continue
  314. case "verbose":
  315. cmd.Flags().Set("verbose", "true")
  316. continue
  317. case "quiet":
  318. cmd.Flags().Set("verbose", "false")
  319. continue
  320. case "mode":
  321. if len(args) > 2 {
  322. switch args[2] {
  323. case "vim":
  324. scanner.SetVimMode(true)
  325. continue
  326. case "emacs", "default":
  327. scanner.SetVimMode(false)
  328. continue
  329. }
  330. }
  331. }
  332. }
  333. case line == "/help", line == "/?":
  334. usage()
  335. continue
  336. case line == "/exit", line == "/bye":
  337. return nil
  338. }
  339. if err := generate(cmd, model, line); err != nil {
  340. return err
  341. }
  342. }
  343. }
  344. func generateBatch(cmd *cobra.Command, model string) error {
  345. scanner := bufio.NewScanner(os.Stdin)
  346. for scanner.Scan() {
  347. prompt := scanner.Text()
  348. fmt.Printf(">>> %s\n", prompt)
  349. if err := generate(cmd, model, prompt); err != nil {
  350. return err
  351. }
  352. }
  353. return nil
  354. }
  355. func RunServer(_ *cobra.Command, _ []string) error {
  356. host := os.Getenv("OLLAMA_HOST")
  357. if host == "" {
  358. host = "127.0.0.1"
  359. }
  360. port := os.Getenv("OLLAMA_PORT")
  361. if port == "" {
  362. port = "11434"
  363. }
  364. ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
  365. if err != nil {
  366. return err
  367. }
  368. return server.Serve(ln)
  369. }
  370. func NewCLI() *cobra.Command {
  371. log.SetFlags(log.LstdFlags | log.Lshortfile)
  372. rootCmd := &cobra.Command{
  373. Use: "ollama",
  374. Short: "Large language model runner",
  375. SilenceUsage: true,
  376. CompletionOptions: cobra.CompletionOptions{
  377. DisableDefaultCmd: true,
  378. },
  379. }
  380. cobra.EnableCommandSorting = false
  381. createCmd := &cobra.Command{
  382. Use: "create MODEL",
  383. Short: "Create a model from a Modelfile",
  384. Args: cobra.MinimumNArgs(1),
  385. RunE: CreateHandler,
  386. }
  387. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  388. runCmd := &cobra.Command{
  389. Use: "run MODEL [PROMPT]",
  390. Short: "Run a model",
  391. Args: cobra.MinimumNArgs(1),
  392. RunE: RunHandler,
  393. }
  394. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  395. serveCmd := &cobra.Command{
  396. Use: "serve",
  397. Aliases: []string{"start"},
  398. Short: "Start ollama",
  399. RunE: RunServer,
  400. }
  401. pullCmd := &cobra.Command{
  402. Use: "pull MODEL",
  403. Short: "Pull a model from a registry",
  404. Args: cobra.MinimumNArgs(1),
  405. RunE: PullHandler,
  406. }
  407. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  408. pushCmd := &cobra.Command{
  409. Use: "push MODEL",
  410. Short: "Push a model to a registry",
  411. Args: cobra.MinimumNArgs(1),
  412. RunE: PushHandler,
  413. }
  414. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  415. listCmd := &cobra.Command{
  416. Use: "list",
  417. Aliases: []string{"ls"},
  418. Short: "List models",
  419. RunE: ListHandler,
  420. }
  421. copyCmd := &cobra.Command{
  422. Use: "cp",
  423. Short: "Copy a model",
  424. Args: cobra.MinimumNArgs(2),
  425. RunE: CopyHandler,
  426. }
  427. deleteCmd := &cobra.Command{
  428. Use: "rm",
  429. Short: "Remove a model",
  430. Args: cobra.MinimumNArgs(1),
  431. RunE: DeleteHandler,
  432. }
  433. rootCmd.AddCommand(
  434. serveCmd,
  435. createCmd,
  436. runCmd,
  437. pullCmd,
  438. pushCmd,
  439. listCmd,
  440. copyCmd,
  441. deleteCmd,
  442. )
  443. return rootCmd
  444. }