123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240 |
- package cmd
import (
	"bufio"
	"context"
	"errors"
	"fmt"
	"log"
	"net"
	"net/http"
	"os"
	"path"
	"path/filepath"
	"strings"
	"time"

	"github.com/schollz/progressbar/v3"
	"github.com/spf13/cobra"
	"golang.org/x/term"

	"github.com/jmorganca/ollama/api"
	"github.com/jmorganca/ollama/server"
)
// cacheDir returns the path of the ".ollama" directory inside the current
// user's home directory.
//
// It panics if the home directory cannot be determined, because the
// signature offers no way to report that failure to the caller.
func cacheDir() string {
	home, err := os.UserHomeDir()
	if err != nil {
		panic(err)
	}

	// filepath.Join builds the path with the operating system's separator;
	// package path is intended for slash-separated paths such as URLs.
	return filepath.Join(home, ".ollama")
}
- func RunRun(cmd *cobra.Command, args []string) error {
- _, err := os.Stat(args[0])
- switch {
- case errors.Is(err, os.ErrNotExist):
- if err := pull(args[0]); err != nil {
- var apiStatusError api.StatusError
- if !errors.As(err, &apiStatusError) {
- return err
- }
- if apiStatusError.StatusCode != http.StatusBadGateway {
- return err
- }
- }
- case err != nil:
- return err
- }
- return RunGenerate(cmd, args)
- }
- func pull(model string) error {
- client := api.NewClient()
- var bar *progressbar.ProgressBar
- return client.Pull(
- context.Background(),
- &api.PullRequest{Model: model},
- func(progress api.PullProgress) error {
- if bar == nil {
- if progress.Percent >= 100 {
- // already downloaded
- return nil
- }
- bar = progressbar.DefaultBytes(progress.Total)
- }
- return bar.Set64(progress.Completed)
- },
- )
- }
- func RunGenerate(cmd *cobra.Command, args []string) error {
- if len(args) > 1 {
- // join all args into a single prompt
- return generate(cmd, args[0], strings.Join(args[1:], " "))
- }
- if term.IsTerminal(int(os.Stdin.Fd())) {
- return generateInteractive(cmd, args[0])
- }
- return generateBatch(cmd, args[0])
- }
// generateContextKeyType is the dedicated type of generateContextKey. A
// context key of a package-private named type cannot compare equal to a key
// defined anywhere else, whereas a bare struct{}{} value would collide with
// every other struct{}{} key stored on the same context.
type generateContextKeyType struct{}

// generateContextKey is the context key under which generate stores the
// Context value of a response on the command's context and reads it back
// for the next request.
var generateContextKey generateContextKeyType
- func generate(cmd *cobra.Command, model, prompt string) error {
- if len(strings.TrimSpace(prompt)) > 0 {
- client := api.NewClient()
- spinner := progressbar.NewOptions(-1,
- progressbar.OptionSetWriter(os.Stderr),
- progressbar.OptionThrottle(60*time.Millisecond),
- progressbar.OptionSpinnerType(14),
- progressbar.OptionSetRenderBlankState(true),
- progressbar.OptionSetElapsedTime(false),
- progressbar.OptionClearOnFinish(),
- )
- go func() {
- for range time.Tick(60 * time.Millisecond) {
- if spinner.IsFinished() {
- break
- }
- spinner.Add(1)
- }
- }()
- var latest api.GenerateResponse
- generateContext, ok := cmd.Context().Value(generateContextKey).([]int)
- if !ok {
- generateContext = []int{}
- }
- request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
- fn := func(resp api.GenerateResponse) error {
- if !spinner.IsFinished() {
- spinner.Finish()
- }
- latest = resp
- fmt.Print(resp.Response)
- cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context))
- return nil
- }
- if err := client.Generate(context.Background(), &request, fn); err != nil {
- return err
- }
- fmt.Println()
- fmt.Println()
- verbose, err := cmd.Flags().GetBool("verbose")
- if err != nil {
- return err
- }
- if verbose {
- latest.Summary()
- }
- }
- return nil
- }
- func generateInteractive(cmd *cobra.Command, model string) error {
- fmt.Print(">>> ")
- scanner := bufio.NewScanner(os.Stdin)
- for scanner.Scan() {
- if err := generate(cmd, model, scanner.Text()); err != nil {
- return err
- }
- fmt.Print(">>> ")
- }
- return nil
- }
- func generateBatch(cmd *cobra.Command, model string) error {
- scanner := bufio.NewScanner(os.Stdin)
- for scanner.Scan() {
- prompt := scanner.Text()
- fmt.Printf(">>> %s\n", prompt)
- if err := generate(cmd, model, prompt); err != nil {
- return err
- }
- }
- return nil
- }
- func RunServer(_ *cobra.Command, _ []string) error {
- host := os.Getenv("OLLAMA_HOST")
- if host == "" {
- host = "127.0.0.1"
- }
- port := os.Getenv("OLLAMA_PORT")
- if port == "" {
- port = "11434"
- }
- ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
- if err != nil {
- return err
- }
- return server.Serve(ln)
- }
- func NewCLI() *cobra.Command {
- log.SetFlags(log.LstdFlags | log.Lshortfile)
- rootCmd := &cobra.Command{
- Use: "ollama",
- Short: "Large language model runner",
- SilenceUsage: true,
- CompletionOptions: cobra.CompletionOptions{
- DisableDefaultCmd: true,
- },
- PersistentPreRunE: func(_ *cobra.Command, args []string) error {
- // create the models directory and it's parent
- return os.MkdirAll(path.Join(cacheDir(), "models"), 0o700)
- },
- }
- cobra.EnableCommandSorting = false
- runCmd := &cobra.Command{
- Use: "run MODEL [PROMPT]",
- Short: "Run a model",
- Args: cobra.MinimumNArgs(1),
- RunE: RunRun,
- }
- runCmd.Flags().Bool("verbose", false, "Show timings for response")
- serveCmd := &cobra.Command{
- Use: "serve",
- Aliases: []string{"start"},
- Short: "Start ollama",
- RunE: RunServer,
- }
- rootCmd.AddCommand(
- serveCmd,
- runCmd,
- )
- return rootCmd
- }
|