cmd.go 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083
  1. package cmd
  2. import (
  3. "bytes"
  4. "context"
  5. "crypto/ed25519"
  6. "crypto/rand"
  7. "crypto/sha256"
  8. "encoding/pem"
  9. "errors"
  10. "fmt"
  11. "io"
  12. "log"
  13. "net"
  14. "net/http"
  15. "os"
  16. "os/exec"
  17. "os/signal"
  18. "path/filepath"
  19. "runtime"
  20. "strings"
  21. "syscall"
  22. "time"
  23. "github.com/olekukonko/tablewriter"
  24. "github.com/spf13/cobra"
  25. "golang.org/x/crypto/ssh"
  26. "golang.org/x/term"
  27. "github.com/jmorganca/ollama/api"
  28. "github.com/jmorganca/ollama/format"
  29. "github.com/jmorganca/ollama/parser"
  30. "github.com/jmorganca/ollama/progress"
  31. "github.com/jmorganca/ollama/readline"
  32. "github.com/jmorganca/ollama/server"
  33. "github.com/jmorganca/ollama/version"
  34. )
  35. func CreateHandler(cmd *cobra.Command, args []string) error {
  36. filename, _ := cmd.Flags().GetString("file")
  37. filename, err := filepath.Abs(filename)
  38. if err != nil {
  39. return err
  40. }
  41. client, err := api.ClientFromEnvironment()
  42. if err != nil {
  43. return err
  44. }
  45. p := progress.NewProgress(os.Stderr)
  46. defer p.Stop()
  47. bars := make(map[string]*progress.Bar)
  48. modelfile, err := os.ReadFile(filename)
  49. if err != nil {
  50. return err
  51. }
  52. commands, err := parser.Parse(bytes.NewReader(modelfile))
  53. if err != nil {
  54. return err
  55. }
  56. home, err := os.UserHomeDir()
  57. if err != nil {
  58. return err
  59. }
  60. status := "transferring model data"
  61. spinner := progress.NewSpinner(status)
  62. p.Add(status, spinner)
  63. for _, c := range commands {
  64. switch c.Name {
  65. case "model", "adapter":
  66. path := c.Args
  67. if path == "~" {
  68. path = home
  69. } else if strings.HasPrefix(path, "~/") {
  70. path = filepath.Join(home, path[2:])
  71. }
  72. if !filepath.IsAbs(path) {
  73. path = filepath.Join(filepath.Dir(filename), path)
  74. }
  75. bin, err := os.Open(path)
  76. if errors.Is(err, os.ErrNotExist) && c.Name == "model" {
  77. continue
  78. } else if err != nil {
  79. return err
  80. }
  81. defer bin.Close()
  82. hash := sha256.New()
  83. if _, err := io.Copy(hash, bin); err != nil {
  84. return err
  85. }
  86. bin.Seek(0, io.SeekStart)
  87. digest := fmt.Sprintf("sha256:%x", hash.Sum(nil))
  88. if err = client.CreateBlob(cmd.Context(), digest, bin); err != nil {
  89. return err
  90. }
  91. modelfile = bytes.ReplaceAll(modelfile, []byte(c.Args), []byte("@"+digest))
  92. }
  93. }
  94. fn := func(resp api.ProgressResponse) error {
  95. if resp.Digest != "" {
  96. spinner.Stop()
  97. bar, ok := bars[resp.Digest]
  98. if !ok {
  99. bar = progress.NewBar(fmt.Sprintf("pulling %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  100. bars[resp.Digest] = bar
  101. p.Add(resp.Digest, bar)
  102. }
  103. bar.Set(resp.Completed)
  104. } else if status != resp.Status {
  105. spinner.Stop()
  106. status = resp.Status
  107. spinner = progress.NewSpinner(status)
  108. p.Add(status, spinner)
  109. }
  110. return nil
  111. }
  112. request := api.CreateRequest{Name: args[0], Modelfile: string(modelfile)}
  113. if err := client.Create(context.Background(), &request, fn); err != nil {
  114. return err
  115. }
  116. return nil
  117. }
  118. func RunHandler(cmd *cobra.Command, args []string) error {
  119. client, err := api.ClientFromEnvironment()
  120. if err != nil {
  121. return err
  122. }
  123. name := args[0]
  124. // check if the model exists on the server
  125. _, err = client.Show(context.Background(), &api.ShowRequest{Name: name})
  126. var statusError api.StatusError
  127. switch {
  128. case errors.As(err, &statusError) && statusError.StatusCode == http.StatusNotFound:
  129. if err := PullHandler(cmd, args); err != nil {
  130. return err
  131. }
  132. case err != nil:
  133. return err
  134. }
  135. return RunGenerate(cmd, args)
  136. }
  137. func PushHandler(cmd *cobra.Command, args []string) error {
  138. client, err := api.ClientFromEnvironment()
  139. if err != nil {
  140. return err
  141. }
  142. insecure, err := cmd.Flags().GetBool("insecure")
  143. if err != nil {
  144. return err
  145. }
  146. p := progress.NewProgress(os.Stderr)
  147. defer p.Stop()
  148. bars := make(map[string]*progress.Bar)
  149. var status string
  150. var spinner *progress.Spinner
  151. fn := func(resp api.ProgressResponse) error {
  152. if resp.Digest != "" {
  153. if spinner != nil {
  154. spinner.Stop()
  155. }
  156. bar, ok := bars[resp.Digest]
  157. if !ok {
  158. bar = progress.NewBar(fmt.Sprintf("pushing %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  159. bars[resp.Digest] = bar
  160. p.Add(resp.Digest, bar)
  161. }
  162. bar.Set(resp.Completed)
  163. } else if status != resp.Status {
  164. if spinner != nil {
  165. spinner.Stop()
  166. }
  167. status = resp.Status
  168. spinner = progress.NewSpinner(status)
  169. p.Add(status, spinner)
  170. }
  171. return nil
  172. }
  173. request := api.PushRequest{Name: args[0], Insecure: insecure}
  174. if err := client.Push(context.Background(), &request, fn); err != nil {
  175. return err
  176. }
  177. spinner.Stop()
  178. return nil
  179. }
  180. func ListHandler(cmd *cobra.Command, args []string) error {
  181. client, err := api.ClientFromEnvironment()
  182. if err != nil {
  183. return err
  184. }
  185. models, err := client.List(context.Background())
  186. if err != nil {
  187. return err
  188. }
  189. var data [][]string
  190. for _, m := range models.Models {
  191. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  192. data = append(data, []string{m.Name, m.Digest[:12], format.HumanBytes(m.Size), format.HumanTime(m.ModifiedAt, "Never")})
  193. }
  194. }
  195. table := tablewriter.NewWriter(os.Stdout)
  196. table.SetHeader([]string{"NAME", "ID", "SIZE", "MODIFIED"})
  197. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  198. table.SetAlignment(tablewriter.ALIGN_LEFT)
  199. table.SetHeaderLine(false)
  200. table.SetBorder(false)
  201. table.SetNoWhiteSpace(true)
  202. table.SetTablePadding("\t")
  203. table.AppendBulk(data)
  204. table.Render()
  205. return nil
  206. }
  207. func DeleteHandler(cmd *cobra.Command, args []string) error {
  208. client, err := api.ClientFromEnvironment()
  209. if err != nil {
  210. return err
  211. }
  212. for _, name := range args {
  213. req := api.DeleteRequest{Name: name}
  214. if err := client.Delete(context.Background(), &req); err != nil {
  215. return err
  216. }
  217. fmt.Printf("deleted '%s'\n", name)
  218. }
  219. return nil
  220. }
  221. func ShowHandler(cmd *cobra.Command, args []string) error {
  222. client, err := api.ClientFromEnvironment()
  223. if err != nil {
  224. return err
  225. }
  226. if len(args) != 1 {
  227. return errors.New("missing model name")
  228. }
  229. license, errLicense := cmd.Flags().GetBool("license")
  230. modelfile, errModelfile := cmd.Flags().GetBool("modelfile")
  231. parameters, errParams := cmd.Flags().GetBool("parameters")
  232. system, errSystem := cmd.Flags().GetBool("system")
  233. template, errTemplate := cmd.Flags().GetBool("template")
  234. for _, boolErr := range []error{errLicense, errModelfile, errParams, errSystem, errTemplate} {
  235. if boolErr != nil {
  236. return errors.New("error retrieving flags")
  237. }
  238. }
  239. flagsSet := 0
  240. showType := ""
  241. if license {
  242. flagsSet++
  243. showType = "license"
  244. }
  245. if modelfile {
  246. flagsSet++
  247. showType = "modelfile"
  248. }
  249. if parameters {
  250. flagsSet++
  251. showType = "parameters"
  252. }
  253. if system {
  254. flagsSet++
  255. showType = "system"
  256. }
  257. if template {
  258. flagsSet++
  259. showType = "template"
  260. }
  261. if flagsSet > 1 {
  262. return errors.New("only one of '--license', '--modelfile', '--parameters', '--system', or '--template' can be specified")
  263. } else if flagsSet == 0 {
  264. return errors.New("one of '--license', '--modelfile', '--parameters', '--system', or '--template' must be specified")
  265. }
  266. req := api.ShowRequest{Name: args[0]}
  267. resp, err := client.Show(context.Background(), &req)
  268. if err != nil {
  269. return err
  270. }
  271. switch showType {
  272. case "license":
  273. fmt.Println(resp.License)
  274. case "modelfile":
  275. fmt.Println(resp.Modelfile)
  276. case "parameters":
  277. fmt.Println(resp.Parameters)
  278. case "system":
  279. fmt.Println(resp.System)
  280. case "template":
  281. fmt.Println(resp.Template)
  282. }
  283. return nil
  284. }
  285. func CopyHandler(cmd *cobra.Command, args []string) error {
  286. client, err := api.ClientFromEnvironment()
  287. if err != nil {
  288. return err
  289. }
  290. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  291. if err := client.Copy(context.Background(), &req); err != nil {
  292. return err
  293. }
  294. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  295. return nil
  296. }
  297. func PullHandler(cmd *cobra.Command, args []string) error {
  298. insecure, err := cmd.Flags().GetBool("insecure")
  299. if err != nil {
  300. return err
  301. }
  302. client, err := api.ClientFromEnvironment()
  303. if err != nil {
  304. return err
  305. }
  306. p := progress.NewProgress(os.Stderr)
  307. defer p.Stop()
  308. bars := make(map[string]*progress.Bar)
  309. var status string
  310. var spinner *progress.Spinner
  311. fn := func(resp api.ProgressResponse) error {
  312. if resp.Digest != "" {
  313. if spinner != nil {
  314. spinner.Stop()
  315. }
  316. bar, ok := bars[resp.Digest]
  317. if !ok {
  318. bar = progress.NewBar(fmt.Sprintf("pulling %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  319. bars[resp.Digest] = bar
  320. p.Add(resp.Digest, bar)
  321. }
  322. bar.Set(resp.Completed)
  323. } else if status != resp.Status {
  324. if spinner != nil {
  325. spinner.Stop()
  326. }
  327. status = resp.Status
  328. spinner = progress.NewSpinner(status)
  329. p.Add(status, spinner)
  330. }
  331. return nil
  332. }
  333. request := api.PullRequest{Name: args[0], Insecure: insecure}
  334. if err := client.Pull(context.Background(), &request, fn); err != nil {
  335. return err
  336. }
  337. return nil
  338. }
  339. func RunGenerate(cmd *cobra.Command, args []string) error {
  340. interactive := true
  341. opts := generateOptions{
  342. Model: args[0],
  343. WordWrap: os.Getenv("TERM") == "xterm-256color",
  344. Options: map[string]interface{}{},
  345. }
  346. format, err := cmd.Flags().GetString("format")
  347. if err != nil {
  348. return err
  349. }
  350. opts.Format = format
  351. prompts := args[1:]
  352. // prepend stdin to the prompt if provided
  353. if !term.IsTerminal(int(os.Stdin.Fd())) {
  354. in, err := io.ReadAll(os.Stdin)
  355. if err != nil {
  356. return err
  357. }
  358. prompts = append([]string{string(in)}, prompts...)
  359. opts.WordWrap = false
  360. interactive = false
  361. }
  362. opts.Prompt = strings.Join(prompts, " ")
  363. if len(prompts) > 0 {
  364. interactive = false
  365. }
  366. nowrap, err := cmd.Flags().GetBool("nowordwrap")
  367. if err != nil {
  368. return err
  369. }
  370. opts.WordWrap = !nowrap
  371. if !interactive {
  372. return generate(cmd, opts)
  373. }
  374. return generateInteractive(cmd, opts)
  375. }
  376. type generateContextKey string
  377. type generateOptions struct {
  378. Model string
  379. Prompt string
  380. WordWrap bool
  381. Format string
  382. Options map[string]interface{}
  383. }
  384. func generate(cmd *cobra.Command, opts generateOptions) error {
  385. client, err := api.ClientFromEnvironment()
  386. if err != nil {
  387. return err
  388. }
  389. p := progress.NewProgress(os.Stderr)
  390. defer p.StopAndClear()
  391. spinner := progress.NewSpinner("")
  392. p.Add("", spinner)
  393. var latest api.GenerateResponse
  394. generateContext, ok := cmd.Context().Value(generateContextKey("context")).([]int)
  395. if !ok {
  396. generateContext = []int{}
  397. }
  398. termWidth, _, err := term.GetSize(int(os.Stdout.Fd()))
  399. if err != nil {
  400. opts.WordWrap = false
  401. }
  402. cancelCtx, cancel := context.WithCancel(context.Background())
  403. defer cancel()
  404. sigChan := make(chan os.Signal, 1)
  405. signal.Notify(sigChan, syscall.SIGINT)
  406. go func() {
  407. <-sigChan
  408. cancel()
  409. }()
  410. var currentLineLength int
  411. var wordBuffer string
  412. request := api.GenerateRequest{
  413. Model: opts.Model,
  414. Prompt: opts.Prompt,
  415. Context: generateContext,
  416. Format: opts.Format,
  417. Options: opts.Options,
  418. }
  419. fn := func(response api.GenerateResponse) error {
  420. p.StopAndClear()
  421. latest = response
  422. if opts.WordWrap {
  423. for _, ch := range response.Response {
  424. if currentLineLength+1 > termWidth-5 {
  425. // backtrack the length of the last word and clear to the end of the line
  426. fmt.Printf("\x1b[%dD\x1b[K\n", len(wordBuffer))
  427. fmt.Printf("%s%c", wordBuffer, ch)
  428. currentLineLength = len(wordBuffer) + 1
  429. } else {
  430. fmt.Print(string(ch))
  431. currentLineLength += 1
  432. switch ch {
  433. case ' ':
  434. wordBuffer = ""
  435. case '\n':
  436. currentLineLength = 0
  437. default:
  438. wordBuffer += string(ch)
  439. }
  440. }
  441. }
  442. } else {
  443. fmt.Print(response.Response)
  444. }
  445. return nil
  446. }
  447. if err := client.Generate(cancelCtx, &request, fn); err != nil {
  448. if errors.Is(err, context.Canceled) {
  449. return nil
  450. }
  451. return err
  452. }
  453. if opts.Prompt != "" {
  454. fmt.Println()
  455. fmt.Println()
  456. }
  457. if !latest.Done {
  458. return nil
  459. }
  460. verbose, err := cmd.Flags().GetBool("verbose")
  461. if err != nil {
  462. return err
  463. }
  464. if verbose {
  465. latest.Summary()
  466. }
  467. ctx := cmd.Context()
  468. ctx = context.WithValue(ctx, generateContextKey("context"), latest.Context)
  469. cmd.SetContext(ctx)
  470. return nil
  471. }
  472. func generateInteractive(cmd *cobra.Command, opts generateOptions) error {
  473. // load the model
  474. loadOpts := generateOptions{
  475. Model: opts.Model,
  476. Prompt: "",
  477. }
  478. if err := generate(cmd, loadOpts); err != nil {
  479. return err
  480. }
  481. usage := func() {
  482. fmt.Fprintln(os.Stderr, "Available Commands:")
  483. fmt.Fprintln(os.Stderr, " /set Set session variables")
  484. fmt.Fprintln(os.Stderr, " /show Show model information")
  485. fmt.Fprintln(os.Stderr, " /bye Exit")
  486. fmt.Fprintln(os.Stderr, " /?, /help Help for a command")
  487. fmt.Fprintln(os.Stderr, "")
  488. fmt.Fprintln(os.Stderr, "Use \"\"\" to begin a multi-line message.")
  489. fmt.Fprintln(os.Stderr, "")
  490. }
  491. usageSet := func() {
  492. fmt.Fprintln(os.Stderr, "Available Commands:")
  493. fmt.Fprintln(os.Stderr, " /set parameter Set a parameter")
  494. fmt.Fprintln(os.Stderr, " /set history Enable history")
  495. fmt.Fprintln(os.Stderr, " /set nohistory Disable history")
  496. fmt.Fprintln(os.Stderr, " /set wordwrap Enable wordwrap")
  497. fmt.Fprintln(os.Stderr, " /set nowordwrap Disable wordwrap")
  498. fmt.Fprintln(os.Stderr, " /set format json Enable JSON mode")
  499. fmt.Fprintln(os.Stderr, " /set noformat Disable formatting")
  500. fmt.Fprintln(os.Stderr, " /set verbose Show LLM stats")
  501. fmt.Fprintln(os.Stderr, " /set quiet Disable LLM stats")
  502. fmt.Fprintln(os.Stderr, "")
  503. }
  504. usageShow := func() {
  505. fmt.Fprintln(os.Stderr, "Available Commands:")
  506. fmt.Fprintln(os.Stderr, " /show license Show model license")
  507. fmt.Fprintln(os.Stderr, " /show modelfile Show Modelfile for this model")
  508. fmt.Fprintln(os.Stderr, " /show parameters Show parameters for this model")
  509. fmt.Fprintln(os.Stderr, " /show system Show system prompt")
  510. fmt.Fprintln(os.Stderr, " /show template Show prompt template")
  511. fmt.Fprintln(os.Stderr, "")
  512. }
  513. // only list out the most common parameters
  514. usageParameters := func() {
  515. fmt.Fprintln(os.Stderr, "Available Parameters:")
  516. fmt.Fprintln(os.Stderr, " /set parameter seed <int> Random number seed")
  517. fmt.Fprintln(os.Stderr, " /set parameter num_predict <int> Max number of tokens to predict")
  518. fmt.Fprintln(os.Stderr, " /set parameter top_k <int> Pick from top k num of tokens")
  519. fmt.Fprintln(os.Stderr, " /set parameter top_p <float> Pick token based on sum of probabilities")
  520. fmt.Fprintln(os.Stderr, " /set parameter num_ctx <int> Set the context size")
  521. fmt.Fprintln(os.Stderr, " /set parameter temperature <float> Set creativity level")
  522. fmt.Fprintln(os.Stderr, " /set parameter repeat_penalty <float> How strongly to penalize repetitions")
  523. fmt.Fprintln(os.Stderr, " /set parameter repeat_last_n <int> Set how far back to look for repetitions")
  524. fmt.Fprintln(os.Stderr, " /set parameter num_gpu <int> The number of layers to send to the GPU")
  525. fmt.Fprintln(os.Stderr, " /set parameter stop \"<string>\", ... Set the stop parameters")
  526. fmt.Fprintln(os.Stderr, "")
  527. }
  528. scanner, err := readline.New(readline.Prompt{
  529. Prompt: ">>> ",
  530. AltPrompt: "... ",
  531. Placeholder: "Send a message (/? for help)",
  532. AltPlaceholder: `Use """ to end multi-line input`,
  533. })
  534. if err != nil {
  535. return err
  536. }
  537. fmt.Print(readline.StartBracketedPaste)
  538. defer fmt.Printf(readline.EndBracketedPaste)
  539. var prompt string
  540. for {
  541. line, err := scanner.Readline()
  542. switch {
  543. case errors.Is(err, io.EOF):
  544. fmt.Println()
  545. return nil
  546. case errors.Is(err, readline.ErrInterrupt):
  547. if line == "" {
  548. fmt.Println("\nUse Ctrl-D or /bye to exit.")
  549. }
  550. scanner.Prompt.UseAlt = false
  551. prompt = ""
  552. continue
  553. case err != nil:
  554. return err
  555. }
  556. switch {
  557. case strings.HasPrefix(prompt, `"""`):
  558. // if the prompt so far starts with """ then we're in multiline mode
  559. // and we need to keep reading until we find a line that ends with """
  560. cut, found := strings.CutSuffix(line, `"""`)
  561. prompt += cut + "\n"
  562. if !found {
  563. continue
  564. }
  565. prompt = strings.TrimPrefix(prompt, `"""`)
  566. scanner.Prompt.UseAlt = false
  567. case strings.HasPrefix(line, `"""`) && len(prompt) == 0:
  568. scanner.Prompt.UseAlt = true
  569. prompt += line + "\n"
  570. continue
  571. case scanner.Pasting:
  572. prompt += line + "\n"
  573. continue
  574. case strings.HasPrefix(line, "/list"):
  575. args := strings.Fields(line)
  576. if err := ListHandler(cmd, args[1:]); err != nil {
  577. return err
  578. }
  579. case strings.HasPrefix(line, "/set"):
  580. args := strings.Fields(line)
  581. if len(args) > 1 {
  582. switch args[1] {
  583. case "history":
  584. scanner.HistoryEnable()
  585. case "nohistory":
  586. scanner.HistoryDisable()
  587. case "wordwrap":
  588. opts.WordWrap = true
  589. fmt.Println("Set 'wordwrap' mode.")
  590. case "nowordwrap":
  591. opts.WordWrap = false
  592. fmt.Println("Set 'nowordwrap' mode.")
  593. case "verbose":
  594. cmd.Flags().Set("verbose", "true")
  595. fmt.Println("Set 'verbose' mode.")
  596. case "quiet":
  597. cmd.Flags().Set("verbose", "false")
  598. fmt.Println("Set 'quiet' mode.")
  599. case "format":
  600. if len(args) < 3 || args[2] != "json" {
  601. fmt.Println("Invalid or missing format. For 'json' mode use '/set format json'")
  602. } else {
  603. opts.Format = args[2]
  604. fmt.Printf("Set format to '%s' mode.\n", args[2])
  605. }
  606. case "noformat":
  607. opts.Format = ""
  608. fmt.Println("Disabled format.")
  609. case "parameter":
  610. if len(args) < 4 {
  611. usageParameters()
  612. continue
  613. }
  614. var params []string
  615. for _, p := range args[3:] {
  616. params = append(params, p)
  617. }
  618. fp, err := api.FormatParams(map[string][]string{args[2]: params})
  619. if err != nil {
  620. fmt.Printf("Couldn't set parameter: %q\n\n", err)
  621. continue
  622. }
  623. fmt.Printf("Set parameter '%s' to '%s'\n\n", args[2], strings.Join(params, ", "))
  624. opts.Options[args[2]] = fp[args[2]]
  625. default:
  626. fmt.Printf("Unknown command '/set %s'. Type /? for help\n", args[1])
  627. }
  628. } else {
  629. usageSet()
  630. }
  631. case strings.HasPrefix(line, "/show"):
  632. args := strings.Fields(line)
  633. if len(args) > 1 {
  634. client, err := api.ClientFromEnvironment()
  635. if err != nil {
  636. fmt.Println("error: couldn't connect to ollama server")
  637. return err
  638. }
  639. resp, err := client.Show(cmd.Context(), &api.ShowRequest{Name: opts.Model})
  640. if err != nil {
  641. fmt.Println("error: couldn't get model")
  642. return err
  643. }
  644. switch args[1] {
  645. case "license":
  646. if resp.License == "" {
  647. fmt.Print("No license was specified for this model.\n\n")
  648. } else {
  649. fmt.Println(resp.License)
  650. }
  651. case "modelfile":
  652. fmt.Println(resp.Modelfile)
  653. case "parameters":
  654. if resp.Parameters == "" {
  655. fmt.Print("No parameters were specified for this model.\n\n")
  656. } else {
  657. if len(opts.Options) > 0 {
  658. fmt.Println("User defined parameters:")
  659. for k, v := range opts.Options {
  660. fmt.Printf("%-*s %v\n", 30, k, v)
  661. }
  662. fmt.Println()
  663. }
  664. fmt.Println("Model defined parameters:")
  665. fmt.Println(resp.Parameters)
  666. }
  667. case "system":
  668. if resp.System == "" {
  669. fmt.Print("No system prompt was specified for this model.\n\n")
  670. } else {
  671. fmt.Println(resp.System)
  672. }
  673. case "template":
  674. if resp.Template == "" {
  675. fmt.Print("No prompt template was specified for this model.\n\n")
  676. } else {
  677. fmt.Println(resp.Template)
  678. }
  679. default:
  680. fmt.Printf("Unknown command '/show %s'. Type /? for help\n", args[1])
  681. }
  682. } else {
  683. usageShow()
  684. }
  685. case strings.HasPrefix(line, "/help"), strings.HasPrefix(line, "/?"):
  686. args := strings.Fields(line)
  687. if len(args) > 1 {
  688. switch args[1] {
  689. case "set", "/set":
  690. usageSet()
  691. case "show", "/show":
  692. usageShow()
  693. }
  694. } else {
  695. usage()
  696. }
  697. case line == "/exit", line == "/bye":
  698. return nil
  699. case strings.HasPrefix(line, "/"):
  700. args := strings.Fields(line)
  701. fmt.Printf("Unknown command '%s'. Type /? for help\n", args[0])
  702. continue
  703. default:
  704. prompt += line
  705. }
  706. if len(prompt) > 0 && prompt[0] != '/' {
  707. opts.Prompt = prompt
  708. if err := generate(cmd, opts); err != nil {
  709. return err
  710. }
  711. prompt = ""
  712. }
  713. }
  714. }
  715. func RunServer(cmd *cobra.Command, _ []string) error {
  716. host, port, err := net.SplitHostPort(os.Getenv("OLLAMA_HOST"))
  717. if err != nil {
  718. host, port = "127.0.0.1", "11434"
  719. if ip := net.ParseIP(strings.Trim(os.Getenv("OLLAMA_HOST"), "[]")); ip != nil {
  720. host = ip.String()
  721. }
  722. }
  723. if err := initializeKeypair(); err != nil {
  724. return err
  725. }
  726. ln, err := net.Listen("tcp", net.JoinHostPort(host, port))
  727. if err != nil {
  728. return err
  729. }
  730. var origins []string
  731. if o := os.Getenv("OLLAMA_ORIGINS"); o != "" {
  732. origins = strings.Split(o, ",")
  733. }
  734. return server.Serve(ln, origins)
  735. }
  736. func initializeKeypair() error {
  737. home, err := os.UserHomeDir()
  738. if err != nil {
  739. return err
  740. }
  741. privKeyPath := filepath.Join(home, ".ollama", "id_ed25519")
  742. pubKeyPath := filepath.Join(home, ".ollama", "id_ed25519.pub")
  743. _, err = os.Stat(privKeyPath)
  744. if os.IsNotExist(err) {
  745. fmt.Printf("Couldn't find '%s'. Generating new private key.\n", privKeyPath)
  746. _, privKey, err := ed25519.GenerateKey(rand.Reader)
  747. if err != nil {
  748. return err
  749. }
  750. privKeyBytes, err := format.OpenSSHPrivateKey(privKey, "")
  751. if err != nil {
  752. return err
  753. }
  754. err = os.MkdirAll(filepath.Dir(privKeyPath), 0o755)
  755. if err != nil {
  756. return fmt.Errorf("could not create directory %w", err)
  757. }
  758. err = os.WriteFile(privKeyPath, pem.EncodeToMemory(privKeyBytes), 0o600)
  759. if err != nil {
  760. return err
  761. }
  762. sshPrivateKey, err := ssh.NewSignerFromKey(privKey)
  763. if err != nil {
  764. return err
  765. }
  766. pubKeyData := ssh.MarshalAuthorizedKey(sshPrivateKey.PublicKey())
  767. err = os.WriteFile(pubKeyPath, pubKeyData, 0o644)
  768. if err != nil {
  769. return err
  770. }
  771. fmt.Printf("Your new public key is: \n\n%s\n", string(pubKeyData))
  772. }
  773. return nil
  774. }
  775. func startMacApp(client *api.Client) error {
  776. exe, err := os.Executable()
  777. if err != nil {
  778. return err
  779. }
  780. link, err := os.Readlink(exe)
  781. if err != nil {
  782. return err
  783. }
  784. if !strings.Contains(link, "Ollama.app") {
  785. return fmt.Errorf("could not find ollama app")
  786. }
  787. path := strings.Split(link, "Ollama.app")
  788. if err := exec.Command("/usr/bin/open", "-a", path[0]+"Ollama.app").Run(); err != nil {
  789. return err
  790. }
  791. // wait for the server to start
  792. timeout := time.After(5 * time.Second)
  793. tick := time.Tick(500 * time.Millisecond)
  794. for {
  795. select {
  796. case <-timeout:
  797. return errors.New("timed out waiting for server to start")
  798. case <-tick:
  799. if err := client.Heartbeat(context.Background()); err == nil {
  800. return nil // server has started
  801. }
  802. }
  803. }
  804. }
  805. func checkServerHeartbeat(_ *cobra.Command, _ []string) error {
  806. client, err := api.ClientFromEnvironment()
  807. if err != nil {
  808. return err
  809. }
  810. if err := client.Heartbeat(context.Background()); err != nil {
  811. if !strings.Contains(err.Error(), "connection refused") {
  812. return err
  813. }
  814. if runtime.GOOS == "darwin" {
  815. if err := startMacApp(client); err != nil {
  816. return fmt.Errorf("could not connect to ollama app, is it running?")
  817. }
  818. } else {
  819. return fmt.Errorf("could not connect to ollama server, run 'ollama serve' to start it")
  820. }
  821. }
  822. return nil
  823. }
  824. func NewCLI() *cobra.Command {
  825. log.SetFlags(log.LstdFlags | log.Lshortfile)
  826. rootCmd := &cobra.Command{
  827. Use: "ollama",
  828. Short: "Large language model runner",
  829. SilenceUsage: true,
  830. SilenceErrors: true,
  831. CompletionOptions: cobra.CompletionOptions{
  832. DisableDefaultCmd: true,
  833. },
  834. Version: version.Version,
  835. }
  836. cobra.EnableCommandSorting = false
  837. createCmd := &cobra.Command{
  838. Use: "create MODEL",
  839. Short: "Create a model from a Modelfile",
  840. Args: cobra.ExactArgs(1),
  841. PreRunE: checkServerHeartbeat,
  842. RunE: CreateHandler,
  843. }
  844. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  845. showCmd := &cobra.Command{
  846. Use: "show MODEL",
  847. Short: "Show information for a model",
  848. Args: cobra.ExactArgs(1),
  849. PreRunE: checkServerHeartbeat,
  850. RunE: ShowHandler,
  851. }
  852. showCmd.Flags().Bool("license", false, "Show license of a model")
  853. showCmd.Flags().Bool("modelfile", false, "Show Modelfile of a model")
  854. showCmd.Flags().Bool("parameters", false, "Show parameters of a model")
  855. showCmd.Flags().Bool("template", false, "Show template of a model")
  856. showCmd.Flags().Bool("system", false, "Show system prompt of a model")
  857. runCmd := &cobra.Command{
  858. Use: "run MODEL [PROMPT]",
  859. Short: "Run a model",
  860. Args: cobra.MinimumNArgs(1),
  861. PreRunE: checkServerHeartbeat,
  862. RunE: RunHandler,
  863. }
  864. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  865. runCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  866. runCmd.Flags().Bool("nowordwrap", false, "Don't wrap words to the next line automatically")
  867. runCmd.Flags().String("format", "", "Response format (e.g. json)")
  868. serveCmd := &cobra.Command{
  869. Use: "serve",
  870. Aliases: []string{"start"},
  871. Short: "Start ollama",
  872. Args: cobra.ExactArgs(0),
  873. RunE: RunServer,
  874. }
  875. pullCmd := &cobra.Command{
  876. Use: "pull MODEL",
  877. Short: "Pull a model from a registry",
  878. Args: cobra.ExactArgs(1),
  879. PreRunE: checkServerHeartbeat,
  880. RunE: PullHandler,
  881. }
  882. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  883. pushCmd := &cobra.Command{
  884. Use: "push MODEL",
  885. Short: "Push a model to a registry",
  886. Args: cobra.ExactArgs(1),
  887. PreRunE: checkServerHeartbeat,
  888. RunE: PushHandler,
  889. }
  890. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  891. listCmd := &cobra.Command{
  892. Use: "list",
  893. Aliases: []string{"ls"},
  894. Short: "List models",
  895. PreRunE: checkServerHeartbeat,
  896. RunE: ListHandler,
  897. }
  898. copyCmd := &cobra.Command{
  899. Use: "cp SOURCE TARGET",
  900. Short: "Copy a model",
  901. Args: cobra.ExactArgs(2),
  902. PreRunE: checkServerHeartbeat,
  903. RunE: CopyHandler,
  904. }
  905. deleteCmd := &cobra.Command{
  906. Use: "rm MODEL [MODEL...]",
  907. Short: "Remove a model",
  908. Args: cobra.MinimumNArgs(1),
  909. PreRunE: checkServerHeartbeat,
  910. RunE: DeleteHandler,
  911. }
  912. rootCmd.AddCommand(
  913. serveCmd,
  914. createCmd,
  915. showCmd,
  916. runCmd,
  917. pullCmd,
  918. pushCmd,
  919. listCmd,
  920. copyCmd,
  921. deleteCmd,
  922. )
  923. return rootCmd
  924. }