cmd.go 6.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338
  1. package cmd
  2. import (
  3. "bufio"
  4. "context"
  5. "errors"
  6. "fmt"
  7. "log"
  8. "net"
  9. "net/http"
  10. "os"
  11. "strings"
  12. "time"
  13. "github.com/dustin/go-humanize"
  14. "github.com/olekukonko/tablewriter"
  15. "github.com/schollz/progressbar/v3"
  16. "github.com/spf13/cobra"
  17. "golang.org/x/term"
  18. "github.com/jmorganca/ollama/api"
  19. "github.com/jmorganca/ollama/format"
  20. "github.com/jmorganca/ollama/server"
  21. )
  22. func create(cmd *cobra.Command, args []string) error {
  23. filename, _ := cmd.Flags().GetString("file")
  24. client := api.NewClient()
  25. var spinner *Spinner
  26. request := api.CreateRequest{Name: args[0], Path: filename}
  27. fn := func(resp api.CreateProgress) error {
  28. if spinner != nil {
  29. spinner.Stop()
  30. }
  31. spinner = NewSpinner(resp.Status)
  32. go spinner.Spin(100 * time.Millisecond)
  33. return nil
  34. }
  35. if err := client.Create(context.Background(), &request, fn); err != nil {
  36. return err
  37. }
  38. if spinner != nil {
  39. spinner.Stop()
  40. }
  41. return nil
  42. }
  43. func RunRun(cmd *cobra.Command, args []string) error {
  44. mp := server.ParseModelPath(args[0])
  45. fp, err := mp.GetManifestPath(false)
  46. if err != nil {
  47. return err
  48. }
  49. _, err = os.Stat(fp)
  50. switch {
  51. case errors.Is(err, os.ErrNotExist):
  52. if err := pull(args[0]); err != nil {
  53. var apiStatusError api.StatusError
  54. if !errors.As(err, &apiStatusError) {
  55. return err
  56. }
  57. if apiStatusError.StatusCode != http.StatusBadGateway {
  58. return err
  59. }
  60. }
  61. case err != nil:
  62. return err
  63. }
  64. return RunGenerate(cmd, args)
  65. }
  66. func push(cmd *cobra.Command, args []string) error {
  67. client := api.NewClient()
  68. request := api.PushRequest{Name: args[0]}
  69. fn := func(resp api.ProgressResponse) error {
  70. fmt.Println(resp.Status)
  71. return nil
  72. }
  73. if err := client.Push(context.Background(), &request, fn); err != nil {
  74. return err
  75. }
  76. return nil
  77. }
  78. func list(cmd *cobra.Command, args []string) error {
  79. client := api.NewClient()
  80. models, err := client.List(context.Background())
  81. if err != nil {
  82. return err
  83. }
  84. var data [][]string
  85. for _, m := range models.Models {
  86. data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
  87. }
  88. table := tablewriter.NewWriter(os.Stdout)
  89. table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
  90. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  91. table.SetAlignment(tablewriter.ALIGN_LEFT)
  92. table.SetHeaderLine(false)
  93. table.SetBorder(false)
  94. table.SetNoWhiteSpace(true)
  95. table.SetTablePadding("\t")
  96. table.AppendBulk(data)
  97. table.Render()
  98. return nil
  99. }
  100. func RunPull(cmd *cobra.Command, args []string) error {
  101. return pull(args[0])
  102. }
  103. func pull(model string) error {
  104. client := api.NewClient()
  105. var currentDigest string
  106. var bar *progressbar.ProgressBar
  107. request := api.PullRequest{Name: model}
  108. fn := func(resp api.ProgressResponse) error {
  109. if resp.Digest != currentDigest && resp.Digest != "" {
  110. currentDigest = resp.Digest
  111. bar = progressbar.DefaultBytes(
  112. int64(resp.Total),
  113. fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
  114. )
  115. bar.Set(resp.Completed)
  116. } else if resp.Digest == currentDigest && resp.Digest != "" {
  117. bar.Set(resp.Completed)
  118. } else {
  119. currentDigest = ""
  120. fmt.Println(resp.Status)
  121. }
  122. return nil
  123. }
  124. if err := client.Pull(context.Background(), &request, fn); err != nil {
  125. return err
  126. }
  127. return nil
  128. }
  129. func RunGenerate(cmd *cobra.Command, args []string) error {
  130. if len(args) > 1 {
  131. // join all args into a single prompt
  132. return generate(cmd, args[0], strings.Join(args[1:], " "))
  133. }
  134. if term.IsTerminal(int(os.Stdin.Fd())) {
  135. return generateInteractive(cmd, args[0])
  136. }
  137. return generateBatch(cmd, args[0])
  138. }
  139. var generateContextKey struct{}
  140. func generate(cmd *cobra.Command, model, prompt string) error {
  141. if len(strings.TrimSpace(prompt)) > 0 {
  142. client := api.NewClient()
  143. spinner := NewSpinner("")
  144. go spinner.Spin(60 * time.Millisecond)
  145. var latest api.GenerateResponse
  146. generateContext, ok := cmd.Context().Value(generateContextKey).([]int)
  147. if !ok {
  148. generateContext = []int{}
  149. }
  150. request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
  151. fn := func(resp api.GenerateResponse) error {
  152. if !spinner.IsFinished() {
  153. spinner.Finish()
  154. }
  155. latest = resp
  156. fmt.Print(resp.Response)
  157. cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context))
  158. return nil
  159. }
  160. if err := client.Generate(context.Background(), &request, fn); err != nil {
  161. return err
  162. }
  163. fmt.Println()
  164. fmt.Println()
  165. verbose, err := cmd.Flags().GetBool("verbose")
  166. if err != nil {
  167. return err
  168. }
  169. if verbose {
  170. latest.Summary()
  171. }
  172. }
  173. return nil
  174. }
  175. func generateInteractive(cmd *cobra.Command, model string) error {
  176. fmt.Print(">>> ")
  177. scanner := bufio.NewScanner(os.Stdin)
  178. for scanner.Scan() {
  179. if err := generate(cmd, model, scanner.Text()); err != nil {
  180. return err
  181. }
  182. fmt.Print(">>> ")
  183. }
  184. return nil
  185. }
  186. func generateBatch(cmd *cobra.Command, model string) error {
  187. scanner := bufio.NewScanner(os.Stdin)
  188. for scanner.Scan() {
  189. prompt := scanner.Text()
  190. fmt.Printf(">>> %s\n", prompt)
  191. if err := generate(cmd, model, prompt); err != nil {
  192. return err
  193. }
  194. }
  195. return nil
  196. }
  197. func RunServer(_ *cobra.Command, _ []string) error {
  198. host := os.Getenv("OLLAMA_HOST")
  199. if host == "" {
  200. host = "127.0.0.1"
  201. }
  202. port := os.Getenv("OLLAMA_PORT")
  203. if port == "" {
  204. port = "11434"
  205. }
  206. ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
  207. if err != nil {
  208. return err
  209. }
  210. return server.Serve(ln)
  211. }
  212. func NewCLI() *cobra.Command {
  213. log.SetFlags(log.LstdFlags | log.Lshortfile)
  214. rootCmd := &cobra.Command{
  215. Use: "ollama",
  216. Short: "Large language model runner",
  217. SilenceUsage: true,
  218. CompletionOptions: cobra.CompletionOptions{
  219. DisableDefaultCmd: true,
  220. },
  221. }
  222. cobra.EnableCommandSorting = false
  223. createCmd := &cobra.Command{
  224. Use: "create MODEL",
  225. Short: "Create a model from a Modelfile",
  226. Args: cobra.MinimumNArgs(1),
  227. RunE: create,
  228. }
  229. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  230. runCmd := &cobra.Command{
  231. Use: "run MODEL [PROMPT]",
  232. Short: "Run a model",
  233. Args: cobra.MinimumNArgs(1),
  234. RunE: RunRun,
  235. }
  236. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  237. serveCmd := &cobra.Command{
  238. Use: "serve",
  239. Aliases: []string{"start"},
  240. Short: "Start ollama",
  241. RunE: RunServer,
  242. }
  243. pullCmd := &cobra.Command{
  244. Use: "pull MODEL",
  245. Short: "Pull a model from a registry",
  246. Args: cobra.MinimumNArgs(1),
  247. RunE: RunPull,
  248. }
  249. pushCmd := &cobra.Command{
  250. Use: "push MODEL",
  251. Short: "Push a model to a registry",
  252. Args: cobra.MinimumNArgs(1),
  253. RunE: push,
  254. }
  255. listCmd := &cobra.Command{
  256. Use: "list",
  257. Short: "List models",
  258. RunE: list,
  259. }
  260. rootCmd.AddCommand(
  261. serveCmd,
  262. createCmd,
  263. runCmd,
  264. pullCmd,
  265. pushCmd,
  266. listCmd,
  267. )
  268. return rootCmd
  269. }