cmd.go 7.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358
  1. package cmd
  2. import (
  3. "bufio"
  4. "context"
  5. "errors"
  6. "fmt"
  7. "log"
  8. "net"
  9. "net/http"
  10. "os"
  11. "path/filepath"
  12. "strings"
  13. "time"
  14. "github.com/dustin/go-humanize"
  15. "github.com/olekukonko/tablewriter"
  16. "github.com/schollz/progressbar/v3"
  17. "github.com/spf13/cobra"
  18. "golang.org/x/term"
  19. "github.com/jmorganca/ollama/api"
  20. "github.com/jmorganca/ollama/format"
  21. "github.com/jmorganca/ollama/server"
  22. )
  // cacheDir returns the ".ollama" directory inside the current user's home
  // directory. It panics when the home directory cannot be determined.
  func cacheDir() string {
  	homeDir, homeErr := os.UserHomeDir()
  	if homeErr == nil {
  		return filepath.Join(homeDir, ".ollama")
  	}
  	panic(homeErr)
  }
  30. func create(cmd *cobra.Command, args []string) error {
  31. filename, _ := cmd.Flags().GetString("file")
  32. client := api.NewClient()
  33. request := api.CreateRequest{Name: args[0], Path: filename}
  34. fn := func(resp api.CreateProgress) error {
  35. fmt.Println(resp.Status)
  36. return nil
  37. }
  38. if err := client.Create(context.Background(), &request, fn); err != nil {
  39. return err
  40. }
  41. return nil
  42. }
  43. func RunRun(cmd *cobra.Command, args []string) error {
  44. mp := server.ParseModelPath(args[0])
  45. fp, err := mp.GetManifestPath(false)
  46. if err != nil {
  47. return err
  48. }
  49. _, err = os.Stat(fp)
  50. switch {
  51. case errors.Is(err, os.ErrNotExist):
  52. if err := pull(args[0]); err != nil {
  53. var apiStatusError api.StatusError
  54. if !errors.As(err, &apiStatusError) {
  55. return err
  56. }
  57. if apiStatusError.StatusCode != http.StatusBadGateway {
  58. return err
  59. }
  60. }
  61. case err != nil:
  62. return err
  63. }
  64. return RunGenerate(cmd, args)
  65. }
  66. func push(cmd *cobra.Command, args []string) error {
  67. client := api.NewClient()
  68. request := api.PushRequest{Name: args[0]}
  69. fn := func(resp api.PushProgress) error {
  70. fmt.Println(resp.Status)
  71. return nil
  72. }
  73. if err := client.Push(context.Background(), &request, fn); err != nil {
  74. return err
  75. }
  76. return nil
  77. }
  78. func list(cmd *cobra.Command, args []string) error {
  79. client := api.NewClient()
  80. models, err := client.List(context.Background())
  81. if err != nil {
  82. return err
  83. }
  84. var data [][]string
  85. for _, m := range models.Models {
  86. data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
  87. }
  88. table := tablewriter.NewWriter(os.Stdout)
  89. table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
  90. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  91. table.SetAlignment(tablewriter.ALIGN_LEFT)
  92. table.SetHeaderLine(false)
  93. table.SetBorder(false)
  94. table.SetNoWhiteSpace(true)
  95. table.SetTablePadding("\t")
  96. table.AppendBulk(data)
  97. table.Render()
  98. return nil
  99. }
  100. func RunPull(cmd *cobra.Command, args []string) error {
  101. return pull(args[0])
  102. }
  103. func pull(model string) error {
  104. client := api.NewClient()
  105. var bar *progressbar.ProgressBar
  106. currentLayer := ""
  107. request := api.PullRequest{Name: model}
  108. fn := func(resp api.PullProgress) error {
  109. if resp.Digest != currentLayer && resp.Digest != "" {
  110. if currentLayer != "" {
  111. fmt.Println()
  112. }
  113. currentLayer = resp.Digest
  114. layerStr := resp.Digest[7:23] + "..."
  115. bar = progressbar.DefaultBytes(
  116. int64(resp.Total),
  117. "pulling "+layerStr,
  118. )
  119. } else if resp.Digest == currentLayer && resp.Digest != "" {
  120. bar.Set(resp.Completed)
  121. } else {
  122. currentLayer = ""
  123. fmt.Println(resp.Status)
  124. }
  125. return nil
  126. }
  127. if err := client.Pull(context.Background(), &request, fn); err != nil {
  128. return err
  129. }
  130. return nil
  131. }
  132. func RunGenerate(cmd *cobra.Command, args []string) error {
  133. if len(args) > 1 {
  134. // join all args into a single prompt
  135. return generate(cmd, args[0], strings.Join(args[1:], " "))
  136. }
  137. if term.IsTerminal(int(os.Stdin.Fd())) {
  138. return generateInteractive(cmd, args[0])
  139. }
  140. return generateBatch(cmd, args[0])
  141. }
  142. var generateContextKey struct{}
  143. func generate(cmd *cobra.Command, model, prompt string) error {
  144. if len(strings.TrimSpace(prompt)) > 0 {
  145. client := api.NewClient()
  146. spinner := progressbar.NewOptions(-1,
  147. progressbar.OptionSetWriter(os.Stderr),
  148. progressbar.OptionThrottle(60*time.Millisecond),
  149. progressbar.OptionSpinnerType(14),
  150. progressbar.OptionSetRenderBlankState(true),
  151. progressbar.OptionSetElapsedTime(false),
  152. progressbar.OptionClearOnFinish(),
  153. )
  154. go func() {
  155. for range time.Tick(60 * time.Millisecond) {
  156. if spinner.IsFinished() {
  157. break
  158. }
  159. spinner.Add(1)
  160. }
  161. }()
  162. var latest api.GenerateResponse
  163. generateContext, ok := cmd.Context().Value(generateContextKey).([]int)
  164. if !ok {
  165. generateContext = []int{}
  166. }
  167. request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
  168. fn := func(resp api.GenerateResponse) error {
  169. if !spinner.IsFinished() {
  170. spinner.Finish()
  171. }
  172. latest = resp
  173. fmt.Print(resp.Response)
  174. cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context))
  175. return nil
  176. }
  177. if err := client.Generate(context.Background(), &request, fn); err != nil {
  178. return err
  179. }
  180. fmt.Println()
  181. fmt.Println()
  182. verbose, err := cmd.Flags().GetBool("verbose")
  183. if err != nil {
  184. return err
  185. }
  186. if verbose {
  187. latest.Summary()
  188. }
  189. }
  190. return nil
  191. }
  192. func generateInteractive(cmd *cobra.Command, model string) error {
  193. fmt.Print(">>> ")
  194. scanner := bufio.NewScanner(os.Stdin)
  195. for scanner.Scan() {
  196. if err := generate(cmd, model, scanner.Text()); err != nil {
  197. return err
  198. }
  199. fmt.Print(">>> ")
  200. }
  201. return nil
  202. }
  203. func generateBatch(cmd *cobra.Command, model string) error {
  204. scanner := bufio.NewScanner(os.Stdin)
  205. for scanner.Scan() {
  206. prompt := scanner.Text()
  207. fmt.Printf(">>> %s\n", prompt)
  208. if err := generate(cmd, model, prompt); err != nil {
  209. return err
  210. }
  211. }
  212. return nil
  213. }
  214. func RunServer(_ *cobra.Command, _ []string) error {
  215. host := os.Getenv("OLLAMA_HOST")
  216. if host == "" {
  217. host = "127.0.0.1"
  218. }
  219. port := os.Getenv("OLLAMA_PORT")
  220. if port == "" {
  221. port = "11434"
  222. }
  223. ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
  224. if err != nil {
  225. return err
  226. }
  227. return server.Serve(ln)
  228. }
  229. func NewCLI() *cobra.Command {
  230. log.SetFlags(log.LstdFlags | log.Lshortfile)
  231. rootCmd := &cobra.Command{
  232. Use: "ollama",
  233. Short: "Large language model runner",
  234. SilenceUsage: true,
  235. CompletionOptions: cobra.CompletionOptions{
  236. DisableDefaultCmd: true,
  237. },
  238. PersistentPreRunE: func(_ *cobra.Command, args []string) error {
  239. // create the models directory and it's parent
  240. return os.MkdirAll(filepath.Join(cacheDir(), "models"), 0o700)
  241. },
  242. }
  243. cobra.EnableCommandSorting = false
  244. createCmd := &cobra.Command{
  245. Use: "create MODEL",
  246. Short: "Create a model from a Modelfile",
  247. Args: cobra.MinimumNArgs(1),
  248. RunE: create,
  249. }
  250. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  251. runCmd := &cobra.Command{
  252. Use: "run MODEL [PROMPT]",
  253. Short: "Run a model",
  254. Args: cobra.MinimumNArgs(1),
  255. RunE: RunRun,
  256. }
  257. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  258. serveCmd := &cobra.Command{
  259. Use: "serve",
  260. Aliases: []string{"start"},
  261. Short: "Start ollama",
  262. RunE: RunServer,
  263. }
  264. pullCmd := &cobra.Command{
  265. Use: "pull MODEL",
  266. Short: "Pull a model from a registry",
  267. Args: cobra.MinimumNArgs(1),
  268. RunE: RunPull,
  269. }
  270. pushCmd := &cobra.Command{
  271. Use: "push MODEL",
  272. Short: "Push a model to a registry",
  273. Args: cobra.MinimumNArgs(1),
  274. RunE: push,
  275. }
  276. listCmd := &cobra.Command{
  277. Use: "list",
  278. Short: "List models",
  279. RunE: list,
  280. }
  281. rootCmd.AddCommand(
  282. serveCmd,
  283. createCmd,
  284. runCmd,
  285. pullCmd,
  286. pushCmd,
  287. listCmd,
  288. )
  289. return rootCmd
  290. }