cmd.go 8.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442
  1. package cmd
  2. import (
  3. "bufio"
  4. "context"
  5. "errors"
  6. "fmt"
  7. "io"
  8. "log"
  9. "net"
  10. "net/http"
  11. "os"
  12. "path/filepath"
  13. "strings"
  14. "time"
  15. "github.com/chzyer/readline"
  16. "github.com/dustin/go-humanize"
  17. "github.com/olekukonko/tablewriter"
  18. "github.com/spf13/cobra"
  19. "github.com/jmorganca/ollama/api"
  20. "github.com/jmorganca/ollama/format"
  21. "github.com/jmorganca/ollama/progressbar"
  22. "github.com/jmorganca/ollama/server"
  23. )
  24. func create(cmd *cobra.Command, args []string) error {
  25. filename, _ := cmd.Flags().GetString("file")
  26. filename, err := filepath.Abs(filename)
  27. if err != nil {
  28. return err
  29. }
  30. client := api.NewClient()
  31. var spinner *Spinner
  32. request := api.CreateRequest{Name: args[0], Path: filename}
  33. fn := func(resp api.CreateProgress) error {
  34. if spinner != nil {
  35. spinner.Stop()
  36. }
  37. spinner = NewSpinner(resp.Status)
  38. go spinner.Spin(100 * time.Millisecond)
  39. return nil
  40. }
  41. if err := client.Create(context.Background(), &request, fn); err != nil {
  42. return err
  43. }
  44. if spinner != nil {
  45. spinner.Stop()
  46. }
  47. return nil
  48. }
  49. func RunRun(cmd *cobra.Command, args []string) error {
  50. mp := server.ParseModelPath(args[0])
  51. fp, err := mp.GetManifestPath(false)
  52. if err != nil {
  53. return err
  54. }
  55. _, err = os.Stat(fp)
  56. switch {
  57. case errors.Is(err, os.ErrNotExist):
  58. if err := pull(args[0]); err != nil {
  59. var apiStatusError api.StatusError
  60. if !errors.As(err, &apiStatusError) {
  61. return err
  62. }
  63. if apiStatusError.StatusCode != http.StatusBadGateway {
  64. return err
  65. }
  66. }
  67. case err != nil:
  68. return err
  69. }
  70. return RunGenerate(cmd, args)
  71. }
  72. func push(cmd *cobra.Command, args []string) error {
  73. client := api.NewClient()
  74. request := api.PushRequest{Name: args[0]}
  75. fn := func(resp api.ProgressResponse) error {
  76. fmt.Println(resp.Status)
  77. return nil
  78. }
  79. if err := client.Push(context.Background(), &request, fn); err != nil {
  80. return err
  81. }
  82. return nil
  83. }
  84. func list(cmd *cobra.Command, args []string) error {
  85. client := api.NewClient()
  86. models, err := client.List(context.Background())
  87. if err != nil {
  88. return err
  89. }
  90. var data [][]string
  91. for _, m := range models.Models {
  92. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  93. data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
  94. }
  95. }
  96. table := tablewriter.NewWriter(os.Stdout)
  97. table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
  98. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  99. table.SetAlignment(tablewriter.ALIGN_LEFT)
  100. table.SetHeaderLine(false)
  101. table.SetBorder(false)
  102. table.SetNoWhiteSpace(true)
  103. table.SetTablePadding("\t")
  104. table.AppendBulk(data)
  105. table.Render()
  106. return nil
  107. }
  108. func RunPull(cmd *cobra.Command, args []string) error {
  109. return pull(args[0])
  110. }
  111. func pull(model string) error {
  112. client := api.NewClient()
  113. var currentDigest string
  114. var bar *progressbar.ProgressBar
  115. request := api.PullRequest{Name: model}
  116. fn := func(resp api.ProgressResponse) error {
  117. if resp.Digest != currentDigest && resp.Digest != "" {
  118. currentDigest = resp.Digest
  119. bar = progressbar.DefaultBytes(
  120. int64(resp.Total),
  121. fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
  122. )
  123. bar.Set(resp.Completed)
  124. } else if resp.Digest == currentDigest && resp.Digest != "" {
  125. bar.Set(resp.Completed)
  126. } else {
  127. currentDigest = ""
  128. fmt.Println(resp.Status)
  129. }
  130. return nil
  131. }
  132. if err := client.Pull(context.Background(), &request, fn); err != nil {
  133. return err
  134. }
  135. return nil
  136. }
  137. func RunGenerate(cmd *cobra.Command, args []string) error {
  138. if len(args) > 1 {
  139. // join all args into a single prompt
  140. return generate(cmd, args[0], strings.Join(args[1:], " "))
  141. }
  142. if readline.IsTerminal(int(os.Stdin.Fd())) {
  143. return generateInteractive(cmd, args[0])
  144. }
  145. return generateBatch(cmd, args[0])
  146. }
  147. var generateContextKey struct{}
  148. func generate(cmd *cobra.Command, model, prompt string) error {
  149. if len(strings.TrimSpace(prompt)) > 0 {
  150. client := api.NewClient()
  151. spinner := NewSpinner("")
  152. go spinner.Spin(60 * time.Millisecond)
  153. var latest api.GenerateResponse
  154. generateContext, ok := cmd.Context().Value(generateContextKey).([]int)
  155. if !ok {
  156. generateContext = []int{}
  157. }
  158. request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
  159. fn := func(resp api.GenerateResponse) error {
  160. if !spinner.IsFinished() {
  161. spinner.Finish()
  162. }
  163. latest = resp
  164. fmt.Print(resp.Response)
  165. cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context))
  166. return nil
  167. }
  168. if err := client.Generate(context.Background(), &request, fn); err != nil {
  169. return err
  170. }
  171. fmt.Println()
  172. fmt.Println()
  173. verbose, err := cmd.Flags().GetBool("verbose")
  174. if err != nil {
  175. return err
  176. }
  177. if verbose {
  178. latest.Summary()
  179. }
  180. }
  181. return nil
  182. }
  183. func generateInteractive(cmd *cobra.Command, model string) error {
  184. home, err := os.UserHomeDir()
  185. if err != nil {
  186. return err
  187. }
  188. completer := readline.NewPrefixCompleter(
  189. readline.PcItem("/help"),
  190. readline.PcItem("/list"),
  191. readline.PcItem("/set",
  192. readline.PcItem("history"),
  193. readline.PcItem("nohistory"),
  194. readline.PcItem("verbose"),
  195. readline.PcItem("quiet"),
  196. readline.PcItem("mode",
  197. readline.PcItem("vim"),
  198. readline.PcItem("emacs"),
  199. readline.PcItem("default"),
  200. ),
  201. ),
  202. readline.PcItem("/exit"),
  203. readline.PcItem("/bye"),
  204. )
  205. usage := func() {
  206. fmt.Fprintln(os.Stderr, "commands:")
  207. fmt.Fprintln(os.Stderr, completer.Tree(" "))
  208. }
  209. config := readline.Config{
  210. Prompt: ">>> ",
  211. HistoryFile: filepath.Join(home, ".ollama", "history"),
  212. AutoComplete: completer,
  213. }
  214. scanner, err := readline.NewEx(&config)
  215. if err != nil {
  216. return err
  217. }
  218. defer scanner.Close()
  219. for {
  220. line, err := scanner.Readline()
  221. switch {
  222. case errors.Is(err, io.EOF):
  223. return nil
  224. case errors.Is(err, readline.ErrInterrupt):
  225. if line == "" {
  226. return nil
  227. }
  228. continue
  229. case err != nil:
  230. return err
  231. }
  232. line = strings.TrimSpace(line)
  233. switch {
  234. case strings.HasPrefix(line, "/list"):
  235. args := strings.Fields(line)
  236. if err := list(cmd, args[1:]); err != nil {
  237. return err
  238. }
  239. continue
  240. case strings.HasPrefix(line, "/set"):
  241. args := strings.Fields(line)
  242. if len(args) > 1 {
  243. switch args[1] {
  244. case "history":
  245. scanner.HistoryEnable()
  246. continue
  247. case "nohistory":
  248. scanner.HistoryDisable()
  249. continue
  250. case "verbose":
  251. cmd.Flags().Set("verbose", "true")
  252. continue
  253. case "quiet":
  254. cmd.Flags().Set("verbose", "false")
  255. continue
  256. case "mode":
  257. if len(args) > 2 {
  258. switch args[2] {
  259. case "vim":
  260. scanner.SetVimMode(true)
  261. continue
  262. case "emacs", "default":
  263. scanner.SetVimMode(false)
  264. continue
  265. }
  266. }
  267. }
  268. }
  269. case line == "/help", line == "/?":
  270. usage()
  271. continue
  272. case line == "/exit", line == "/bye":
  273. return nil
  274. }
  275. if err := generate(cmd, model, line); err != nil {
  276. return err
  277. }
  278. }
  279. }
  280. func generateBatch(cmd *cobra.Command, model string) error {
  281. scanner := bufio.NewScanner(os.Stdin)
  282. for scanner.Scan() {
  283. prompt := scanner.Text()
  284. fmt.Printf(">>> %s\n", prompt)
  285. if err := generate(cmd, model, prompt); err != nil {
  286. return err
  287. }
  288. }
  289. return nil
  290. }
  291. func RunServer(_ *cobra.Command, _ []string) error {
  292. host := os.Getenv("OLLAMA_HOST")
  293. if host == "" {
  294. host = "127.0.0.1"
  295. }
  296. port := os.Getenv("OLLAMA_PORT")
  297. if port == "" {
  298. port = "11434"
  299. }
  300. ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
  301. if err != nil {
  302. return err
  303. }
  304. return server.Serve(ln)
  305. }
  306. func NewCLI() *cobra.Command {
  307. log.SetFlags(log.LstdFlags | log.Lshortfile)
  308. rootCmd := &cobra.Command{
  309. Use: "ollama",
  310. Short: "Large language model runner",
  311. SilenceUsage: true,
  312. CompletionOptions: cobra.CompletionOptions{
  313. DisableDefaultCmd: true,
  314. },
  315. }
  316. cobra.EnableCommandSorting = false
  317. createCmd := &cobra.Command{
  318. Use: "create MODEL",
  319. Short: "Create a model from a Modelfile",
  320. Args: cobra.MinimumNArgs(1),
  321. RunE: create,
  322. }
  323. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  324. runCmd := &cobra.Command{
  325. Use: "run MODEL [PROMPT]",
  326. Short: "Run a model",
  327. Args: cobra.MinimumNArgs(1),
  328. RunE: RunRun,
  329. }
  330. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  331. serveCmd := &cobra.Command{
  332. Use: "serve",
  333. Aliases: []string{"start"},
  334. Short: "Start ollama",
  335. RunE: RunServer,
  336. }
  337. pullCmd := &cobra.Command{
  338. Use: "pull MODEL",
  339. Short: "Pull a model from a registry",
  340. Args: cobra.MinimumNArgs(1),
  341. RunE: RunPull,
  342. }
  343. pushCmd := &cobra.Command{
  344. Use: "push MODEL",
  345. Short: "Push a model to a registry",
  346. Args: cobra.MinimumNArgs(1),
  347. RunE: push,
  348. }
  349. listCmd := &cobra.Command{
  350. Use: "list",
  351. Aliases: []string{"ls"},
  352. Short: "List models",
  353. RunE: list,
  354. }
  355. rootCmd.AddCommand(
  356. serveCmd,
  357. createCmd,
  358. runCmd,
  359. pullCmd,
  360. pushCmd,
  361. listCmd,
  362. )
  363. return rootCmd
  364. }