123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320 |
- package cmd
- import (
- "bufio"
- "context"
- "errors"
- "fmt"
- "log"
- "net"
- "net/http"
- "os"
- "path/filepath"
- "strings"
- "time"
- "github.com/schollz/progressbar/v3"
- "github.com/spf13/cobra"
- "golang.org/x/term"
- "github.com/jmorganca/ollama/api"
- "github.com/jmorganca/ollama/server"
- )
// cacheDir returns the path of the ".ollama" directory located directly
// inside the current user's home directory.
//
// It panics when the home directory cannot be determined.
func cacheDir() string {
	homeDir, homeErr := os.UserHomeDir()
	if homeErr == nil {
		return filepath.Join(homeDir, ".ollama")
	}

	panic(homeErr)
}
- func create(cmd *cobra.Command, args []string) error {
- filename, _ := cmd.Flags().GetString("file")
- client := api.NewClient()
- request := api.CreateRequest{Name: args[0], Path: filename}
- fn := func(resp api.CreateProgress) error {
- fmt.Println(resp.Status)
- return nil
- }
- if err := client.Create(context.Background(), &request, fn); err != nil {
- return err
- }
- return nil
- }
- func RunRun(cmd *cobra.Command, args []string) error {
- mp := server.ParseModelPath(args[0])
- fp, err := mp.GetManifestPath(false)
- if err != nil {
- return err
- }
- _, err = os.Stat(fp)
- switch {
- case errors.Is(err, os.ErrNotExist):
- if err := pull(args[0]); err != nil {
- var apiStatusError api.StatusError
- if !errors.As(err, &apiStatusError) {
- return err
- }
- if apiStatusError.StatusCode != http.StatusBadGateway {
- return err
- }
- }
- case err != nil:
- return err
- }
- return RunGenerate(cmd, args)
- }
- func push(cmd *cobra.Command, args []string) error {
- client := api.NewClient()
- request := api.PushRequest{Name: args[0]}
- fn := func(resp api.PushProgress) error {
- fmt.Println(resp.Status)
- return nil
- }
- if err := client.Push(context.Background(), &request, fn); err != nil {
- return err
- }
- return nil
- }
- func RunPull(cmd *cobra.Command, args []string) error {
- return pull(args[0])
- }
- func pull(model string) error {
- client := api.NewClient()
- var bar *progressbar.ProgressBar
- currentLayer := ""
- request := api.PullRequest{Name: model}
- fn := func(resp api.PullProgress) error {
- if resp.Digest != currentLayer && resp.Digest != "" {
- if currentLayer != "" {
- fmt.Println()
- }
- currentLayer = resp.Digest
- layerStr := resp.Digest[7:23] + "..."
- bar = progressbar.DefaultBytes(
- int64(resp.Total),
- "pulling "+layerStr,
- )
- } else if resp.Digest == currentLayer && resp.Digest != "" {
- bar.Set(resp.Completed)
- } else {
- currentLayer = ""
- fmt.Println(resp.Status)
- }
- return nil
- }
- if err := client.Pull(context.Background(), &request, fn); err != nil {
- return err
- }
- return nil
- }
- func RunGenerate(cmd *cobra.Command, args []string) error {
- if len(args) > 1 {
- // join all args into a single prompt
- return generate(cmd, args[0], strings.Join(args[1:], " "))
- }
- if term.IsTerminal(int(os.Stdin.Fd())) {
- return generateInteractive(cmd, args[0])
- }
- return generateBatch(cmd, args[0])
- }
// generateContextKeyType is the private type of generateContextKey. Giving
// the key its own named type guarantees it can never compare equal to a
// context key defined elsewhere (for example a bare struct{}{}).
type generateContextKeyType struct{}

// generateContextKey is the context key under which the context of the most
// recent generation is stored on the command's context.
var generateContextKey generateContextKeyType
- func generate(cmd *cobra.Command, model, prompt string) error {
- if len(strings.TrimSpace(prompt)) > 0 {
- client := api.NewClient()
- spinner := progressbar.NewOptions(-1,
- progressbar.OptionSetWriter(os.Stderr),
- progressbar.OptionThrottle(60*time.Millisecond),
- progressbar.OptionSpinnerType(14),
- progressbar.OptionSetRenderBlankState(true),
- progressbar.OptionSetElapsedTime(false),
- progressbar.OptionClearOnFinish(),
- )
- go func() {
- for range time.Tick(60 * time.Millisecond) {
- if spinner.IsFinished() {
- break
- }
- spinner.Add(1)
- }
- }()
- var latest api.GenerateResponse
- generateContext, ok := cmd.Context().Value(generateContextKey).([]int)
- if !ok {
- generateContext = []int{}
- }
- request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
- fn := func(resp api.GenerateResponse) error {
- if !spinner.IsFinished() {
- spinner.Finish()
- }
- latest = resp
- fmt.Print(resp.Response)
- cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context))
- return nil
- }
- if err := client.Generate(context.Background(), &request, fn); err != nil {
- return err
- }
- fmt.Println()
- fmt.Println()
- verbose, err := cmd.Flags().GetBool("verbose")
- if err != nil {
- return err
- }
- if verbose {
- latest.Summary()
- }
- }
- return nil
- }
- func generateInteractive(cmd *cobra.Command, model string) error {
- fmt.Print(">>> ")
- scanner := bufio.NewScanner(os.Stdin)
- for scanner.Scan() {
- if err := generate(cmd, model, scanner.Text()); err != nil {
- return err
- }
- fmt.Print(">>> ")
- }
- return nil
- }
- func generateBatch(cmd *cobra.Command, model string) error {
- scanner := bufio.NewScanner(os.Stdin)
- for scanner.Scan() {
- prompt := scanner.Text()
- fmt.Printf(">>> %s\n", prompt)
- if err := generate(cmd, model, prompt); err != nil {
- return err
- }
- }
- return nil
- }
- func RunServer(_ *cobra.Command, _ []string) error {
- host := os.Getenv("OLLAMA_HOST")
- if host == "" {
- host = "127.0.0.1"
- }
- port := os.Getenv("OLLAMA_PORT")
- if port == "" {
- port = "11434"
- }
- ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
- if err != nil {
- return err
- }
- return server.Serve(ln)
- }
- func NewCLI() *cobra.Command {
- log.SetFlags(log.LstdFlags | log.Lshortfile)
- rootCmd := &cobra.Command{
- Use: "ollama",
- Short: "Large language model runner",
- SilenceUsage: true,
- CompletionOptions: cobra.CompletionOptions{
- DisableDefaultCmd: true,
- },
- PersistentPreRunE: func(_ *cobra.Command, args []string) error {
- // create the models directory and it's parent
- return os.MkdirAll(filepath.Join(cacheDir(), "models"), 0o700)
- },
- }
- cobra.EnableCommandSorting = false
- createCmd := &cobra.Command{
- Use: "create MODEL",
- Short: "Create a model from a Modelfile",
- Args: cobra.MinimumNArgs(1),
- RunE: create,
- }
- createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
- runCmd := &cobra.Command{
- Use: "run MODEL [PROMPT]",
- Short: "Run a model",
- Args: cobra.MinimumNArgs(1),
- RunE: RunRun,
- }
- runCmd.Flags().Bool("verbose", false, "Show timings for response")
- serveCmd := &cobra.Command{
- Use: "serve",
- Aliases: []string{"start"},
- Short: "Start ollama",
- RunE: RunServer,
- }
- pullCmd := &cobra.Command{
- Use: "pull MODEL",
- Short: "Pull a model from a registry",
- Args: cobra.MinimumNArgs(1),
- RunE: RunPull,
- }
- pushCmd := &cobra.Command{
- Use: "push MODEL",
- Short: "Push a model to a registry",
- Args: cobra.MinimumNArgs(1),
- RunE: push,
- }
- rootCmd.AddCommand(
- serveCmd,
- createCmd,
- runCmd,
- pullCmd,
- pushCmd,
- )
- return rootCmd
- }
|