cmd.go 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510
  1. package cmd
  2. import (
  3. "bufio"
  4. "context"
  5. "errors"
  6. "fmt"
  7. "io"
  8. "log"
  9. "net"
  10. "net/http"
  11. "os"
  12. "path/filepath"
  13. "strings"
  14. "time"
  15. "github.com/chzyer/readline"
  16. "github.com/dustin/go-humanize"
  17. "github.com/olekukonko/tablewriter"
  18. "github.com/spf13/cobra"
  19. "github.com/jmorganca/ollama/api"
  20. "github.com/jmorganca/ollama/format"
  21. "github.com/jmorganca/ollama/progressbar"
  22. "github.com/jmorganca/ollama/server"
  23. )
  24. func CreateHandler(cmd *cobra.Command, args []string) error {
  25. filename, _ := cmd.Flags().GetString("file")
  26. filename, err := filepath.Abs(filename)
  27. if err != nil {
  28. return err
  29. }
  30. client := api.NewClient()
  31. var spinner *Spinner
  32. request := api.CreateRequest{Name: args[0], Path: filename}
  33. fn := func(resp api.CreateProgress) error {
  34. if spinner != nil {
  35. spinner.Stop()
  36. }
  37. spinner = NewSpinner(resp.Status)
  38. go spinner.Spin(100 * time.Millisecond)
  39. return nil
  40. }
  41. if err := client.Create(context.Background(), &request, fn); err != nil {
  42. return err
  43. }
  44. if spinner != nil {
  45. spinner.Stop()
  46. }
  47. return nil
  48. }
  49. func RunHandler(cmd *cobra.Command, args []string) error {
  50. mp := server.ParseModelPath(args[0])
  51. fp, err := mp.GetManifestPath(false)
  52. if err != nil {
  53. return err
  54. }
  55. _, err = os.Stat(fp)
  56. switch {
  57. case errors.Is(err, os.ErrNotExist):
  58. if err := pull(args[0], false); err != nil {
  59. var apiStatusError api.StatusError
  60. if !errors.As(err, &apiStatusError) {
  61. return err
  62. }
  63. if apiStatusError.StatusCode != http.StatusBadGateway {
  64. return err
  65. }
  66. }
  67. case err != nil:
  68. return err
  69. }
  70. return RunGenerate(cmd, args)
  71. }
  72. func PushHandler(cmd *cobra.Command, args []string) error {
  73. client := api.NewClient()
  74. insecure, err := cmd.Flags().GetBool("insecure")
  75. if err != nil {
  76. return err
  77. }
  78. var currentDigest string
  79. var bar *progressbar.ProgressBar
  80. request := api.PushRequest{Name: args[0], Insecure: insecure}
  81. fn := func(resp api.ProgressResponse) error {
  82. if resp.Digest != currentDigest && resp.Digest != "" {
  83. currentDigest = resp.Digest
  84. bar = progressbar.DefaultBytes(
  85. int64(resp.Total),
  86. fmt.Sprintf("pushing %s...", resp.Digest[7:19]),
  87. )
  88. bar.Set(resp.Completed)
  89. } else if resp.Digest == currentDigest && resp.Digest != "" {
  90. bar.Set(resp.Completed)
  91. } else {
  92. currentDigest = ""
  93. fmt.Println(resp.Status)
  94. }
  95. return nil
  96. }
  97. if err := client.Push(context.Background(), &request, fn); err != nil {
  98. return err
  99. }
  100. return nil
  101. }
  102. func ListHandler(cmd *cobra.Command, args []string) error {
  103. client := api.NewClient()
  104. models, err := client.List(context.Background())
  105. if err != nil {
  106. return err
  107. }
  108. var data [][]string
  109. for _, m := range models.Models {
  110. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  111. data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
  112. }
  113. }
  114. table := tablewriter.NewWriter(os.Stdout)
  115. table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
  116. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  117. table.SetAlignment(tablewriter.ALIGN_LEFT)
  118. table.SetHeaderLine(false)
  119. table.SetBorder(false)
  120. table.SetNoWhiteSpace(true)
  121. table.SetTablePadding("\t")
  122. table.AppendBulk(data)
  123. table.Render()
  124. return nil
  125. }
  126. func DeleteHandler(cmd *cobra.Command, args []string) error {
  127. client := api.NewClient()
  128. req := api.DeleteRequest{Name: args[0]}
  129. if err := client.Delete(context.Background(), &req); err != nil {
  130. return err
  131. }
  132. fmt.Printf("deleted '%s'\n", args[0])
  133. return nil
  134. }
  135. func CopyHandler(cmd *cobra.Command, args []string) error {
  136. client := api.NewClient()
  137. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  138. if err := client.Copy(context.Background(), &req); err != nil {
  139. return err
  140. }
  141. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  142. return nil
  143. }
  144. func PullHandler(cmd *cobra.Command, args []string) error {
  145. insecure, err := cmd.Flags().GetBool("insecure")
  146. if err != nil {
  147. return err
  148. }
  149. return pull(args[0], insecure)
  150. }
  151. func pull(model string, insecure bool) error {
  152. client := api.NewClient()
  153. var currentDigest string
  154. var bar *progressbar.ProgressBar
  155. request := api.PullRequest{Name: model, Insecure: insecure}
  156. fn := func(resp api.ProgressResponse) error {
  157. if resp.Digest != currentDigest && resp.Digest != "" {
  158. currentDigest = resp.Digest
  159. bar = progressbar.DefaultBytes(
  160. int64(resp.Total),
  161. fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
  162. )
  163. bar.Set(resp.Completed)
  164. } else if resp.Digest == currentDigest && resp.Digest != "" {
  165. bar.Set(resp.Completed)
  166. } else {
  167. currentDigest = ""
  168. fmt.Println(resp.Status)
  169. }
  170. return nil
  171. }
  172. if err := client.Pull(context.Background(), &request, fn); err != nil {
  173. return err
  174. }
  175. return nil
  176. }
  177. func RunGenerate(cmd *cobra.Command, args []string) error {
  178. if len(args) > 1 {
  179. // join all args into a single prompt
  180. return generate(cmd, args[0], strings.Join(args[1:], " "))
  181. }
  182. if readline.IsTerminal(int(os.Stdin.Fd())) {
  183. return generateInteractive(cmd, args[0])
  184. }
  185. return generateBatch(cmd, args[0])
  186. }
  187. var generateContextKey struct{}
  188. func generate(cmd *cobra.Command, model, prompt string) error {
  189. if len(strings.TrimSpace(prompt)) > 0 {
  190. client := api.NewClient()
  191. spinner := NewSpinner("")
  192. go spinner.Spin(60 * time.Millisecond)
  193. var latest api.GenerateResponse
  194. generateContext, ok := cmd.Context().Value(generateContextKey).([]int)
  195. if !ok {
  196. generateContext = []int{}
  197. }
  198. request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
  199. fn := func(resp api.GenerateResponse) error {
  200. if !spinner.IsFinished() {
  201. spinner.Finish()
  202. }
  203. latest = resp
  204. fmt.Print(resp.Response)
  205. cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context))
  206. return nil
  207. }
  208. if err := client.Generate(context.Background(), &request, fn); err != nil {
  209. return err
  210. }
  211. fmt.Println()
  212. fmt.Println()
  213. verbose, err := cmd.Flags().GetBool("verbose")
  214. if err != nil {
  215. return err
  216. }
  217. if verbose {
  218. latest.Summary()
  219. }
  220. }
  221. return nil
  222. }
  223. func generateInteractive(cmd *cobra.Command, model string) error {
  224. home, err := os.UserHomeDir()
  225. if err != nil {
  226. return err
  227. }
  228. completer := readline.NewPrefixCompleter(
  229. readline.PcItem("/help"),
  230. readline.PcItem("/list"),
  231. readline.PcItem("/set",
  232. readline.PcItem("history"),
  233. readline.PcItem("nohistory"),
  234. readline.PcItem("verbose"),
  235. readline.PcItem("quiet"),
  236. readline.PcItem("mode",
  237. readline.PcItem("vim"),
  238. readline.PcItem("emacs"),
  239. readline.PcItem("default"),
  240. ),
  241. ),
  242. readline.PcItem("/exit"),
  243. readline.PcItem("/bye"),
  244. )
  245. usage := func() {
  246. fmt.Fprintln(os.Stderr, "commands:")
  247. fmt.Fprintln(os.Stderr, completer.Tree(" "))
  248. }
  249. config := readline.Config{
  250. Prompt: ">>> ",
  251. HistoryFile: filepath.Join(home, ".ollama", "history"),
  252. AutoComplete: completer,
  253. }
  254. scanner, err := readline.NewEx(&config)
  255. if err != nil {
  256. return err
  257. }
  258. defer scanner.Close()
  259. for {
  260. line, err := scanner.Readline()
  261. switch {
  262. case errors.Is(err, io.EOF):
  263. return nil
  264. case errors.Is(err, readline.ErrInterrupt):
  265. if line == "" {
  266. return nil
  267. }
  268. continue
  269. case err != nil:
  270. return err
  271. }
  272. line = strings.TrimSpace(line)
  273. switch {
  274. case strings.HasPrefix(line, "/list"):
  275. args := strings.Fields(line)
  276. if err := ListHandler(cmd, args[1:]); err != nil {
  277. return err
  278. }
  279. continue
  280. case strings.HasPrefix(line, "/set"):
  281. args := strings.Fields(line)
  282. if len(args) > 1 {
  283. switch args[1] {
  284. case "history":
  285. scanner.HistoryEnable()
  286. continue
  287. case "nohistory":
  288. scanner.HistoryDisable()
  289. continue
  290. case "verbose":
  291. cmd.Flags().Set("verbose", "true")
  292. continue
  293. case "quiet":
  294. cmd.Flags().Set("verbose", "false")
  295. continue
  296. case "mode":
  297. if len(args) > 2 {
  298. switch args[2] {
  299. case "vim":
  300. scanner.SetVimMode(true)
  301. continue
  302. case "emacs", "default":
  303. scanner.SetVimMode(false)
  304. continue
  305. }
  306. }
  307. }
  308. }
  309. case line == "/help", line == "/?":
  310. usage()
  311. continue
  312. case line == "/exit", line == "/bye":
  313. return nil
  314. }
  315. if err := generate(cmd, model, line); err != nil {
  316. return err
  317. }
  318. }
  319. }
  320. func generateBatch(cmd *cobra.Command, model string) error {
  321. scanner := bufio.NewScanner(os.Stdin)
  322. for scanner.Scan() {
  323. prompt := scanner.Text()
  324. fmt.Printf(">>> %s\n", prompt)
  325. if err := generate(cmd, model, prompt); err != nil {
  326. return err
  327. }
  328. }
  329. return nil
  330. }
  331. func RunServer(_ *cobra.Command, _ []string) error {
  332. host := os.Getenv("OLLAMA_HOST")
  333. if host == "" {
  334. host = "127.0.0.1"
  335. }
  336. port := os.Getenv("OLLAMA_PORT")
  337. if port == "" {
  338. port = "11434"
  339. }
  340. ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
  341. if err != nil {
  342. return err
  343. }
  344. return server.Serve(ln)
  345. }
  346. func NewCLI() *cobra.Command {
  347. log.SetFlags(log.LstdFlags | log.Lshortfile)
  348. rootCmd := &cobra.Command{
  349. Use: "ollama",
  350. Short: "Large language model runner",
  351. SilenceUsage: true,
  352. CompletionOptions: cobra.CompletionOptions{
  353. DisableDefaultCmd: true,
  354. },
  355. }
  356. cobra.EnableCommandSorting = false
  357. createCmd := &cobra.Command{
  358. Use: "create MODEL",
  359. Short: "Create a model from a Modelfile",
  360. Args: cobra.MinimumNArgs(1),
  361. RunE: CreateHandler,
  362. }
  363. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  364. runCmd := &cobra.Command{
  365. Use: "run MODEL [PROMPT]",
  366. Short: "Run a model",
  367. Args: cobra.MinimumNArgs(1),
  368. RunE: RunHandler,
  369. }
  370. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  371. serveCmd := &cobra.Command{
  372. Use: "serve",
  373. Aliases: []string{"start"},
  374. Short: "Start ollama",
  375. RunE: RunServer,
  376. }
  377. pullCmd := &cobra.Command{
  378. Use: "pull MODEL",
  379. Short: "Pull a model from a registry",
  380. Args: cobra.MinimumNArgs(1),
  381. RunE: PullHandler,
  382. }
  383. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  384. pushCmd := &cobra.Command{
  385. Use: "push MODEL",
  386. Short: "Push a model to a registry",
  387. Args: cobra.MinimumNArgs(1),
  388. RunE: PushHandler,
  389. }
  390. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  391. listCmd := &cobra.Command{
  392. Use: "list",
  393. Aliases: []string{"ls"},
  394. Short: "List models",
  395. RunE: ListHandler,
  396. }
  397. copyCmd := &cobra.Command{
  398. Use: "cp",
  399. Short: "Copy a model",
  400. Args: cobra.MinimumNArgs(2),
  401. RunE: CopyHandler,
  402. }
  403. deleteCmd := &cobra.Command{
  404. Use: "rm",
  405. Short: "Remove a model",
  406. Args: cobra.MinimumNArgs(1),
  407. RunE: DeleteHandler,
  408. }
  409. rootCmd.AddCommand(
  410. serveCmd,
  411. createCmd,
  412. runCmd,
  413. pullCmd,
  414. pushCmd,
  415. listCmd,
  416. copyCmd,
  417. deleteCmd,
  418. )
  419. return rootCmd
  420. }