cmd.go 28 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160
  1. package cmd
  2. import (
  3. "bytes"
  4. "context"
  5. "crypto/ed25519"
  6. "crypto/rand"
  7. "crypto/sha256"
  8. "encoding/pem"
  9. "errors"
  10. "fmt"
  11. "io"
  12. "log"
  13. "net"
  14. "net/http"
  15. "os"
  16. "os/exec"
  17. "os/signal"
  18. "path/filepath"
  19. "runtime"
  20. "strings"
  21. "syscall"
  22. "time"
  23. "github.com/olekukonko/tablewriter"
  24. "github.com/spf13/cobra"
  25. "golang.org/x/crypto/ssh"
  26. "golang.org/x/term"
  27. "github.com/jmorganca/ollama/api"
  28. "github.com/jmorganca/ollama/format"
  29. "github.com/jmorganca/ollama/parser"
  30. "github.com/jmorganca/ollama/progress"
  31. "github.com/jmorganca/ollama/readline"
  32. "github.com/jmorganca/ollama/server"
  33. "github.com/jmorganca/ollama/version"
  34. )
  35. func CreateHandler(cmd *cobra.Command, args []string) error {
  36. filename, _ := cmd.Flags().GetString("file")
  37. filename, err := filepath.Abs(filename)
  38. if err != nil {
  39. return err
  40. }
  41. client, err := api.ClientFromEnvironment()
  42. if err != nil {
  43. return err
  44. }
  45. p := progress.NewProgress(os.Stderr)
  46. defer p.Stop()
  47. bars := make(map[string]*progress.Bar)
  48. modelfile, err := os.ReadFile(filename)
  49. if err != nil {
  50. return err
  51. }
  52. commands, err := parser.Parse(bytes.NewReader(modelfile))
  53. if err != nil {
  54. return err
  55. }
  56. home, err := os.UserHomeDir()
  57. if err != nil {
  58. return err
  59. }
  60. status := "transferring model data"
  61. spinner := progress.NewSpinner(status)
  62. p.Add(status, spinner)
  63. for _, c := range commands {
  64. switch c.Name {
  65. case "model", "adapter":
  66. path := c.Args
  67. if path == "~" {
  68. path = home
  69. } else if strings.HasPrefix(path, "~/") {
  70. path = filepath.Join(home, path[2:])
  71. }
  72. if !filepath.IsAbs(path) {
  73. path = filepath.Join(filepath.Dir(filename), path)
  74. }
  75. bin, err := os.Open(path)
  76. if errors.Is(err, os.ErrNotExist) && c.Name == "model" {
  77. continue
  78. } else if err != nil {
  79. return err
  80. }
  81. defer bin.Close()
  82. hash := sha256.New()
  83. if _, err := io.Copy(hash, bin); err != nil {
  84. return err
  85. }
  86. bin.Seek(0, io.SeekStart)
  87. digest := fmt.Sprintf("sha256:%x", hash.Sum(nil))
  88. if err = client.CreateBlob(cmd.Context(), digest, bin); err != nil {
  89. return err
  90. }
  91. modelfile = bytes.ReplaceAll(modelfile, []byte(c.Args), []byte("@"+digest))
  92. }
  93. }
  94. fn := func(resp api.ProgressResponse) error {
  95. if resp.Digest != "" {
  96. spinner.Stop()
  97. bar, ok := bars[resp.Digest]
  98. if !ok {
  99. bar = progress.NewBar(fmt.Sprintf("pulling %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  100. bars[resp.Digest] = bar
  101. p.Add(resp.Digest, bar)
  102. }
  103. bar.Set(resp.Completed)
  104. } else if status != resp.Status {
  105. spinner.Stop()
  106. status = resp.Status
  107. spinner = progress.NewSpinner(status)
  108. p.Add(status, spinner)
  109. }
  110. return nil
  111. }
  112. request := api.CreateRequest{Name: args[0], Modelfile: string(modelfile)}
  113. if err := client.Create(context.Background(), &request, fn); err != nil {
  114. return err
  115. }
  116. return nil
  117. }
  118. func RunHandler(cmd *cobra.Command, args []string) error {
  119. client, err := api.ClientFromEnvironment()
  120. if err != nil {
  121. return err
  122. }
  123. name := args[0]
  124. // check if the model exists on the server
  125. _, err = client.Show(context.Background(), &api.ShowRequest{Name: name})
  126. var statusError api.StatusError
  127. switch {
  128. case errors.As(err, &statusError) && statusError.StatusCode == http.StatusNotFound:
  129. if err := PullHandler(cmd, args); err != nil {
  130. return err
  131. }
  132. case err != nil:
  133. return err
  134. }
  135. return RunGenerate(cmd, args)
  136. }
  137. func PushHandler(cmd *cobra.Command, args []string) error {
  138. client, err := api.ClientFromEnvironment()
  139. if err != nil {
  140. return err
  141. }
  142. insecure, err := cmd.Flags().GetBool("insecure")
  143. if err != nil {
  144. return err
  145. }
  146. p := progress.NewProgress(os.Stderr)
  147. defer p.Stop()
  148. bars := make(map[string]*progress.Bar)
  149. var status string
  150. var spinner *progress.Spinner
  151. fn := func(resp api.ProgressResponse) error {
  152. if resp.Digest != "" {
  153. if spinner != nil {
  154. spinner.Stop()
  155. }
  156. bar, ok := bars[resp.Digest]
  157. if !ok {
  158. bar = progress.NewBar(fmt.Sprintf("pushing %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  159. bars[resp.Digest] = bar
  160. p.Add(resp.Digest, bar)
  161. }
  162. bar.Set(resp.Completed)
  163. } else if status != resp.Status {
  164. if spinner != nil {
  165. spinner.Stop()
  166. }
  167. status = resp.Status
  168. spinner = progress.NewSpinner(status)
  169. p.Add(status, spinner)
  170. }
  171. return nil
  172. }
  173. request := api.PushRequest{Name: args[0], Insecure: insecure}
  174. if err := client.Push(context.Background(), &request, fn); err != nil {
  175. return err
  176. }
  177. spinner.Stop()
  178. return nil
  179. }
  180. func ListHandler(cmd *cobra.Command, args []string) error {
  181. client, err := api.ClientFromEnvironment()
  182. if err != nil {
  183. return err
  184. }
  185. models, err := client.List(context.Background())
  186. if err != nil {
  187. return err
  188. }
  189. var data [][]string
  190. for _, m := range models.Models {
  191. if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
  192. data = append(data, []string{m.Name, m.Digest[:12], format.HumanBytes(m.Size), format.HumanTime(m.ModifiedAt, "Never")})
  193. }
  194. }
  195. table := tablewriter.NewWriter(os.Stdout)
  196. table.SetHeader([]string{"NAME", "ID", "SIZE", "MODIFIED"})
  197. table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
  198. table.SetAlignment(tablewriter.ALIGN_LEFT)
  199. table.SetHeaderLine(false)
  200. table.SetBorder(false)
  201. table.SetNoWhiteSpace(true)
  202. table.SetTablePadding("\t")
  203. table.AppendBulk(data)
  204. table.Render()
  205. return nil
  206. }
  207. func DeleteHandler(cmd *cobra.Command, args []string) error {
  208. client, err := api.ClientFromEnvironment()
  209. if err != nil {
  210. return err
  211. }
  212. for _, name := range args {
  213. req := api.DeleteRequest{Name: name}
  214. if err := client.Delete(context.Background(), &req); err != nil {
  215. return err
  216. }
  217. fmt.Printf("deleted '%s'\n", name)
  218. }
  219. return nil
  220. }
  221. func ShowHandler(cmd *cobra.Command, args []string) error {
  222. client, err := api.ClientFromEnvironment()
  223. if err != nil {
  224. return err
  225. }
  226. if len(args) != 1 {
  227. return errors.New("missing model name")
  228. }
  229. license, errLicense := cmd.Flags().GetBool("license")
  230. modelfile, errModelfile := cmd.Flags().GetBool("modelfile")
  231. parameters, errParams := cmd.Flags().GetBool("parameters")
  232. system, errSystem := cmd.Flags().GetBool("system")
  233. template, errTemplate := cmd.Flags().GetBool("template")
  234. for _, boolErr := range []error{errLicense, errModelfile, errParams, errSystem, errTemplate} {
  235. if boolErr != nil {
  236. return errors.New("error retrieving flags")
  237. }
  238. }
  239. flagsSet := 0
  240. showType := ""
  241. if license {
  242. flagsSet++
  243. showType = "license"
  244. }
  245. if modelfile {
  246. flagsSet++
  247. showType = "modelfile"
  248. }
  249. if parameters {
  250. flagsSet++
  251. showType = "parameters"
  252. }
  253. if system {
  254. flagsSet++
  255. showType = "system"
  256. }
  257. if template {
  258. flagsSet++
  259. showType = "template"
  260. }
  261. if flagsSet > 1 {
  262. return errors.New("only one of '--license', '--modelfile', '--parameters', '--system', or '--template' can be specified")
  263. } else if flagsSet == 0 {
  264. return errors.New("one of '--license', '--modelfile', '--parameters', '--system', or '--template' must be specified")
  265. }
  266. req := api.ShowRequest{Name: args[0]}
  267. resp, err := client.Show(context.Background(), &req)
  268. if err != nil {
  269. return err
  270. }
  271. switch showType {
  272. case "license":
  273. fmt.Println(resp.License)
  274. case "modelfile":
  275. fmt.Println(resp.Modelfile)
  276. case "parameters":
  277. fmt.Println(resp.Parameters)
  278. case "system":
  279. fmt.Println(resp.System)
  280. case "template":
  281. fmt.Println(resp.Template)
  282. }
  283. return nil
  284. }
  285. func CopyHandler(cmd *cobra.Command, args []string) error {
  286. client, err := api.ClientFromEnvironment()
  287. if err != nil {
  288. return err
  289. }
  290. req := api.CopyRequest{Source: args[0], Destination: args[1]}
  291. if err := client.Copy(context.Background(), &req); err != nil {
  292. return err
  293. }
  294. fmt.Printf("copied '%s' to '%s'\n", args[0], args[1])
  295. return nil
  296. }
  297. func PullHandler(cmd *cobra.Command, args []string) error {
  298. insecure, err := cmd.Flags().GetBool("insecure")
  299. if err != nil {
  300. return err
  301. }
  302. client, err := api.ClientFromEnvironment()
  303. if err != nil {
  304. return err
  305. }
  306. p := progress.NewProgress(os.Stderr)
  307. defer p.Stop()
  308. bars := make(map[string]*progress.Bar)
  309. var status string
  310. var spinner *progress.Spinner
  311. fn := func(resp api.ProgressResponse) error {
  312. if resp.Digest != "" {
  313. if spinner != nil {
  314. spinner.Stop()
  315. }
  316. bar, ok := bars[resp.Digest]
  317. if !ok {
  318. bar = progress.NewBar(fmt.Sprintf("pulling %s...", resp.Digest[7:19]), resp.Total, resp.Completed)
  319. bars[resp.Digest] = bar
  320. p.Add(resp.Digest, bar)
  321. }
  322. bar.Set(resp.Completed)
  323. } else if status != resp.Status {
  324. if spinner != nil {
  325. spinner.Stop()
  326. }
  327. status = resp.Status
  328. spinner = progress.NewSpinner(status)
  329. p.Add(status, spinner)
  330. }
  331. return nil
  332. }
  333. request := api.PullRequest{Name: args[0], Insecure: insecure}
  334. if err := client.Pull(context.Background(), &request, fn); err != nil {
  335. return err
  336. }
  337. return nil
  338. }
  339. func RunGenerate(cmd *cobra.Command, args []string) error {
  340. interactive := true
  341. opts := generateOptions{
  342. Model: args[0],
  343. WordWrap: os.Getenv("TERM") == "xterm-256color",
  344. Options: map[string]interface{}{},
  345. }
  346. format, err := cmd.Flags().GetString("format")
  347. if err != nil {
  348. return err
  349. }
  350. opts.Format = format
  351. prompts := args[1:]
  352. // prepend stdin to the prompt if provided
  353. if !term.IsTerminal(int(os.Stdin.Fd())) {
  354. in, err := io.ReadAll(os.Stdin)
  355. if err != nil {
  356. return err
  357. }
  358. prompts = append([]string{string(in)}, prompts...)
  359. opts.WordWrap = false
  360. interactive = false
  361. }
  362. opts.Prompt = strings.Join(prompts, " ")
  363. if len(prompts) > 0 {
  364. interactive = false
  365. }
  366. nowrap, err := cmd.Flags().GetBool("nowordwrap")
  367. if err != nil {
  368. return err
  369. }
  370. opts.WordWrap = !nowrap
  371. if !interactive {
  372. return generate(cmd, opts)
  373. }
  374. return generateInteractive(cmd, opts)
  375. }
  376. type generateContextKey string
  377. type generateOptions struct {
  378. Model string
  379. Prompt string
  380. WordWrap bool
  381. Format string
  382. System string
  383. Template string
  384. Options map[string]interface{}
  385. }
  386. func generate(cmd *cobra.Command, opts generateOptions) error {
  387. client, err := api.ClientFromEnvironment()
  388. if err != nil {
  389. return err
  390. }
  391. p := progress.NewProgress(os.Stderr)
  392. defer p.StopAndClear()
  393. spinner := progress.NewSpinner("")
  394. p.Add("", spinner)
  395. var latest api.GenerateResponse
  396. generateContext, ok := cmd.Context().Value(generateContextKey("context")).([]int)
  397. if !ok {
  398. generateContext = []int{}
  399. }
  400. termWidth, _, err := term.GetSize(int(os.Stdout.Fd()))
  401. if err != nil {
  402. opts.WordWrap = false
  403. }
  404. cancelCtx, cancel := context.WithCancel(context.Background())
  405. defer cancel()
  406. sigChan := make(chan os.Signal, 1)
  407. signal.Notify(sigChan, syscall.SIGINT)
  408. go func() {
  409. <-sigChan
  410. cancel()
  411. }()
  412. var currentLineLength int
  413. var wordBuffer string
  414. request := api.GenerateRequest{
  415. Model: opts.Model,
  416. Prompt: opts.Prompt,
  417. Context: generateContext,
  418. Format: opts.Format,
  419. System: opts.System,
  420. Template: opts.Template,
  421. Options: opts.Options,
  422. }
  423. fn := func(response api.GenerateResponse) error {
  424. p.StopAndClear()
  425. latest = response
  426. termWidth, _, _ = term.GetSize(int(os.Stdout.Fd()))
  427. if opts.WordWrap && termWidth >= 10 {
  428. for _, ch := range response.Response {
  429. if currentLineLength+1 > termWidth-5 {
  430. if len(wordBuffer) > termWidth-10 {
  431. fmt.Printf("%s%c", wordBuffer, ch)
  432. wordBuffer = ""
  433. currentLineLength = 0
  434. continue
  435. }
  436. // backtrack the length of the last word and clear to the end of the line
  437. fmt.Printf("\x1b[%dD\x1b[K\n", len(wordBuffer))
  438. fmt.Printf("%s%c", wordBuffer, ch)
  439. currentLineLength = len(wordBuffer) + 1
  440. } else {
  441. fmt.Print(string(ch))
  442. currentLineLength += 1
  443. switch ch {
  444. case ' ':
  445. wordBuffer = ""
  446. case '\n':
  447. currentLineLength = 0
  448. default:
  449. wordBuffer += string(ch)
  450. }
  451. }
  452. }
  453. } else {
  454. fmt.Printf("%s%s", wordBuffer, response.Response)
  455. if len(wordBuffer) > 0 {
  456. wordBuffer = ""
  457. }
  458. }
  459. return nil
  460. }
  461. if err := client.Generate(cancelCtx, &request, fn); err != nil {
  462. if errors.Is(err, context.Canceled) {
  463. return nil
  464. }
  465. return err
  466. }
  467. if opts.Prompt != "" {
  468. fmt.Println()
  469. fmt.Println()
  470. }
  471. if !latest.Done {
  472. return nil
  473. }
  474. verbose, err := cmd.Flags().GetBool("verbose")
  475. if err != nil {
  476. return err
  477. }
  478. if verbose {
  479. latest.Summary()
  480. }
  481. ctx := cmd.Context()
  482. ctx = context.WithValue(ctx, generateContextKey("context"), latest.Context)
  483. cmd.SetContext(ctx)
  484. return nil
  485. }
  486. type MultilineState int
  487. const (
  488. MultilineNone MultilineState = iota
  489. MultilinePrompt
  490. MultilineSystem
  491. MultilineTemplate
  492. )
  493. func generateInteractive(cmd *cobra.Command, opts generateOptions) error {
  494. // load the model
  495. loadOpts := generateOptions{
  496. Model: opts.Model,
  497. Prompt: "",
  498. }
  499. if err := generate(cmd, loadOpts); err != nil {
  500. return err
  501. }
  502. usage := func() {
  503. fmt.Fprintln(os.Stderr, "Available Commands:")
  504. fmt.Fprintln(os.Stderr, " /set Set session variables")
  505. fmt.Fprintln(os.Stderr, " /show Show model information")
  506. fmt.Fprintln(os.Stderr, " /bye Exit")
  507. fmt.Fprintln(os.Stderr, " /?, /help Help for a command")
  508. fmt.Fprintln(os.Stderr, "")
  509. fmt.Fprintln(os.Stderr, "Use \"\"\" to begin a multi-line message.")
  510. fmt.Fprintln(os.Stderr, "")
  511. }
  512. usageSet := func() {
  513. fmt.Fprintln(os.Stderr, "Available Commands:")
  514. fmt.Fprintln(os.Stderr, " /set parameter ... Set a parameter")
  515. fmt.Fprintln(os.Stderr, " /set system <string> Set system prompt")
  516. fmt.Fprintln(os.Stderr, " /set template <string> Set prompt template")
  517. fmt.Fprintln(os.Stderr, " /set history Enable history")
  518. fmt.Fprintln(os.Stderr, " /set nohistory Disable history")
  519. fmt.Fprintln(os.Stderr, " /set wordwrap Enable wordwrap")
  520. fmt.Fprintln(os.Stderr, " /set nowordwrap Disable wordwrap")
  521. fmt.Fprintln(os.Stderr, " /set format json Enable JSON mode")
  522. fmt.Fprintln(os.Stderr, " /set noformat Disable formatting")
  523. fmt.Fprintln(os.Stderr, " /set verbose Show LLM stats")
  524. fmt.Fprintln(os.Stderr, " /set quiet Disable LLM stats")
  525. fmt.Fprintln(os.Stderr, "")
  526. }
  527. usageShow := func() {
  528. fmt.Fprintln(os.Stderr, "Available Commands:")
  529. fmt.Fprintln(os.Stderr, " /show license Show model license")
  530. fmt.Fprintln(os.Stderr, " /show modelfile Show Modelfile for this model")
  531. fmt.Fprintln(os.Stderr, " /show parameters Show parameters for this model")
  532. fmt.Fprintln(os.Stderr, " /show system Show system prompt")
  533. fmt.Fprintln(os.Stderr, " /show template Show prompt template")
  534. fmt.Fprintln(os.Stderr, "")
  535. }
  536. // only list out the most common parameters
  537. usageParameters := func() {
  538. fmt.Fprintln(os.Stderr, "Available Parameters:")
  539. fmt.Fprintln(os.Stderr, " /set parameter seed <int> Random number seed")
  540. fmt.Fprintln(os.Stderr, " /set parameter num_predict <int> Max number of tokens to predict")
  541. fmt.Fprintln(os.Stderr, " /set parameter top_k <int> Pick from top k num of tokens")
  542. fmt.Fprintln(os.Stderr, " /set parameter top_p <float> Pick token based on sum of probabilities")
  543. fmt.Fprintln(os.Stderr, " /set parameter num_ctx <int> Set the context size")
  544. fmt.Fprintln(os.Stderr, " /set parameter temperature <float> Set creativity level")
  545. fmt.Fprintln(os.Stderr, " /set parameter repeat_penalty <float> How strongly to penalize repetitions")
  546. fmt.Fprintln(os.Stderr, " /set parameter repeat_last_n <int> Set how far back to look for repetitions")
  547. fmt.Fprintln(os.Stderr, " /set parameter num_gpu <int> The number of layers to send to the GPU")
  548. fmt.Fprintln(os.Stderr, " /set parameter stop \"<string>\", ... Set the stop parameters")
  549. fmt.Fprintln(os.Stderr, "")
  550. }
  551. scanner, err := readline.New(readline.Prompt{
  552. Prompt: ">>> ",
  553. AltPrompt: "... ",
  554. Placeholder: "Send a message (/? for help)",
  555. AltPlaceholder: `Use """ to end multi-line input`,
  556. })
  557. if err != nil {
  558. return err
  559. }
  560. fmt.Print(readline.StartBracketedPaste)
  561. defer fmt.Printf(readline.EndBracketedPaste)
  562. var multiline MultilineState
  563. var prompt string
  564. for {
  565. line, err := scanner.Readline()
  566. switch {
  567. case errors.Is(err, io.EOF):
  568. fmt.Println()
  569. return nil
  570. case errors.Is(err, readline.ErrInterrupt):
  571. if line == "" {
  572. fmt.Println("\nUse Ctrl-D or /bye to exit.")
  573. }
  574. scanner.Prompt.UseAlt = false
  575. prompt = ""
  576. continue
  577. case err != nil:
  578. return err
  579. }
  580. switch {
  581. case strings.HasPrefix(prompt, `"""`):
  582. // if the prompt so far starts with """ then we're in multiline mode
  583. // and we need to keep reading until we find a line that ends with """
  584. cut, found := strings.CutSuffix(line, `"""`)
  585. prompt += cut + "\n"
  586. if !found {
  587. continue
  588. }
  589. prompt = strings.TrimPrefix(prompt, `"""`)
  590. scanner.Prompt.UseAlt = false
  591. switch multiline {
  592. case MultilineSystem:
  593. opts.System = prompt
  594. prompt = ""
  595. fmt.Println("Set system template.\n")
  596. case MultilineTemplate:
  597. opts.Template = prompt
  598. prompt = ""
  599. fmt.Println("Set model template.\n")
  600. }
  601. multiline = MultilineNone
  602. case strings.HasPrefix(line, `"""`) && len(prompt) == 0:
  603. scanner.Prompt.UseAlt = true
  604. multiline = MultilinePrompt
  605. prompt += line + "\n"
  606. continue
  607. case scanner.Pasting:
  608. prompt += line + "\n"
  609. continue
  610. case strings.HasPrefix(line, "/list"):
  611. args := strings.Fields(line)
  612. if err := ListHandler(cmd, args[1:]); err != nil {
  613. return err
  614. }
  615. case strings.HasPrefix(line, "/set"):
  616. args := strings.Fields(line)
  617. if len(args) > 1 {
  618. switch args[1] {
  619. case "history":
  620. scanner.HistoryEnable()
  621. case "nohistory":
  622. scanner.HistoryDisable()
  623. case "wordwrap":
  624. opts.WordWrap = true
  625. fmt.Println("Set 'wordwrap' mode.")
  626. case "nowordwrap":
  627. opts.WordWrap = false
  628. fmt.Println("Set 'nowordwrap' mode.")
  629. case "verbose":
  630. cmd.Flags().Set("verbose", "true")
  631. fmt.Println("Set 'verbose' mode.")
  632. case "quiet":
  633. cmd.Flags().Set("verbose", "false")
  634. fmt.Println("Set 'quiet' mode.")
  635. case "format":
  636. if len(args) < 3 || args[2] != "json" {
  637. fmt.Println("Invalid or missing format. For 'json' mode use '/set format json'")
  638. } else {
  639. opts.Format = args[2]
  640. fmt.Printf("Set format to '%s' mode.\n", args[2])
  641. }
  642. case "noformat":
  643. opts.Format = ""
  644. fmt.Println("Disabled format.")
  645. case "parameter":
  646. if len(args) < 4 {
  647. usageParameters()
  648. continue
  649. }
  650. var params []string
  651. for _, p := range args[3:] {
  652. params = append(params, p)
  653. }
  654. fp, err := api.FormatParams(map[string][]string{args[2]: params})
  655. if err != nil {
  656. fmt.Printf("Couldn't set parameter: %q\n\n", err)
  657. continue
  658. }
  659. fmt.Printf("Set parameter '%s' to '%s'\n\n", args[2], strings.Join(params, ", "))
  660. opts.Options[args[2]] = fp[args[2]]
  661. case "system", "template":
  662. if len(args) < 3 {
  663. usageSet()
  664. continue
  665. }
  666. line := strings.Join(args[2:], " ")
  667. line = strings.TrimPrefix(line, `"""`)
  668. if strings.HasPrefix(args[2], `"""`) {
  669. cut, found := strings.CutSuffix(line, `"""`)
  670. prompt += cut + "\n"
  671. if found {
  672. opts.System = prompt
  673. if args[1] == "system" {
  674. fmt.Println("Set system template.\n")
  675. } else {
  676. fmt.Println("Set prompt template.\n")
  677. }
  678. prompt = ""
  679. } else {
  680. prompt = `"""` + prompt
  681. if args[1] == "system" {
  682. multiline = MultilineSystem
  683. } else {
  684. multiline = MultilineTemplate
  685. }
  686. scanner.Prompt.UseAlt = true
  687. }
  688. } else {
  689. opts.System = line
  690. fmt.Println("Set system template.\n")
  691. }
  692. default:
  693. fmt.Printf("Unknown command '/set %s'. Type /? for help\n", args[1])
  694. }
  695. } else {
  696. usageSet()
  697. }
  698. case strings.HasPrefix(line, "/show"):
  699. args := strings.Fields(line)
  700. if len(args) > 1 {
  701. client, err := api.ClientFromEnvironment()
  702. if err != nil {
  703. fmt.Println("error: couldn't connect to ollama server")
  704. return err
  705. }
  706. resp, err := client.Show(cmd.Context(), &api.ShowRequest{Name: opts.Model})
  707. if err != nil {
  708. fmt.Println("error: couldn't get model")
  709. return err
  710. }
  711. switch args[1] {
  712. case "license":
  713. if resp.License == "" {
  714. fmt.Print("No license was specified for this model.\n\n")
  715. } else {
  716. fmt.Println(resp.License)
  717. }
  718. case "modelfile":
  719. fmt.Println(resp.Modelfile)
  720. case "parameters":
  721. if resp.Parameters == "" {
  722. fmt.Print("No parameters were specified for this model.\n\n")
  723. } else {
  724. if len(opts.Options) > 0 {
  725. fmt.Println("User defined parameters:")
  726. for k, v := range opts.Options {
  727. fmt.Printf("%-*s %v\n", 30, k, v)
  728. }
  729. fmt.Println()
  730. }
  731. fmt.Println("Model defined parameters:")
  732. fmt.Println(resp.Parameters)
  733. }
  734. case "system":
  735. switch {
  736. case opts.System != "":
  737. fmt.Println(opts.System + "\n")
  738. case resp.System != "":
  739. fmt.Println(resp.System + "\n")
  740. default:
  741. fmt.Print("No system prompt was specified for this model.\n\n")
  742. }
  743. case "template":
  744. switch {
  745. case opts.Template != "":
  746. fmt.Println(opts.Template + "\n")
  747. case resp.Template != "":
  748. fmt.Println(resp.Template)
  749. default:
  750. fmt.Print("No prompt template was specified for this model.\n\n")
  751. }
  752. default:
  753. fmt.Printf("Unknown command '/show %s'. Type /? for help\n", args[1])
  754. }
  755. } else {
  756. usageShow()
  757. }
  758. case strings.HasPrefix(line, "/help"), strings.HasPrefix(line, "/?"):
  759. args := strings.Fields(line)
  760. if len(args) > 1 {
  761. switch args[1] {
  762. case "set", "/set":
  763. usageSet()
  764. case "show", "/show":
  765. usageShow()
  766. }
  767. } else {
  768. usage()
  769. }
  770. case line == "/exit", line == "/bye":
  771. return nil
  772. case strings.HasPrefix(line, "/"):
  773. args := strings.Fields(line)
  774. fmt.Printf("Unknown command '%s'. Type /? for help\n", args[0])
  775. continue
  776. default:
  777. prompt += line
  778. }
  779. if len(prompt) > 0 && multiline == MultilineNone {
  780. opts.Prompt = prompt
  781. if err := generate(cmd, opts); err != nil {
  782. return err
  783. }
  784. prompt = ""
  785. }
  786. }
  787. }
  788. func RunServer(cmd *cobra.Command, _ []string) error {
  789. host, port, err := net.SplitHostPort(os.Getenv("OLLAMA_HOST"))
  790. if err != nil {
  791. host, port = "127.0.0.1", "11434"
  792. if ip := net.ParseIP(strings.Trim(os.Getenv("OLLAMA_HOST"), "[]")); ip != nil {
  793. host = ip.String()
  794. }
  795. }
  796. if err := initializeKeypair(); err != nil {
  797. return err
  798. }
  799. ln, err := net.Listen("tcp", net.JoinHostPort(host, port))
  800. if err != nil {
  801. return err
  802. }
  803. var origins []string
  804. if o := os.Getenv("OLLAMA_ORIGINS"); o != "" {
  805. origins = strings.Split(o, ",")
  806. }
  807. return server.Serve(ln, origins)
  808. }
  809. func initializeKeypair() error {
  810. home, err := os.UserHomeDir()
  811. if err != nil {
  812. return err
  813. }
  814. privKeyPath := filepath.Join(home, ".ollama", "id_ed25519")
  815. pubKeyPath := filepath.Join(home, ".ollama", "id_ed25519.pub")
  816. _, err = os.Stat(privKeyPath)
  817. if os.IsNotExist(err) {
  818. fmt.Printf("Couldn't find '%s'. Generating new private key.\n", privKeyPath)
  819. _, privKey, err := ed25519.GenerateKey(rand.Reader)
  820. if err != nil {
  821. return err
  822. }
  823. privKeyBytes, err := format.OpenSSHPrivateKey(privKey, "")
  824. if err != nil {
  825. return err
  826. }
  827. err = os.MkdirAll(filepath.Dir(privKeyPath), 0o755)
  828. if err != nil {
  829. return fmt.Errorf("could not create directory %w", err)
  830. }
  831. err = os.WriteFile(privKeyPath, pem.EncodeToMemory(privKeyBytes), 0o600)
  832. if err != nil {
  833. return err
  834. }
  835. sshPrivateKey, err := ssh.NewSignerFromKey(privKey)
  836. if err != nil {
  837. return err
  838. }
  839. pubKeyData := ssh.MarshalAuthorizedKey(sshPrivateKey.PublicKey())
  840. err = os.WriteFile(pubKeyPath, pubKeyData, 0o644)
  841. if err != nil {
  842. return err
  843. }
  844. fmt.Printf("Your new public key is: \n\n%s\n", string(pubKeyData))
  845. }
  846. return nil
  847. }
  848. func startMacApp(client *api.Client) error {
  849. exe, err := os.Executable()
  850. if err != nil {
  851. return err
  852. }
  853. link, err := os.Readlink(exe)
  854. if err != nil {
  855. return err
  856. }
  857. if !strings.Contains(link, "Ollama.app") {
  858. return fmt.Errorf("could not find ollama app")
  859. }
  860. path := strings.Split(link, "Ollama.app")
  861. if err := exec.Command("/usr/bin/open", "-a", path[0]+"Ollama.app").Run(); err != nil {
  862. return err
  863. }
  864. // wait for the server to start
  865. timeout := time.After(5 * time.Second)
  866. tick := time.Tick(500 * time.Millisecond)
  867. for {
  868. select {
  869. case <-timeout:
  870. return errors.New("timed out waiting for server to start")
  871. case <-tick:
  872. if err := client.Heartbeat(context.Background()); err == nil {
  873. return nil // server has started
  874. }
  875. }
  876. }
  877. }
  878. func checkServerHeartbeat(_ *cobra.Command, _ []string) error {
  879. client, err := api.ClientFromEnvironment()
  880. if err != nil {
  881. return err
  882. }
  883. if err := client.Heartbeat(context.Background()); err != nil {
  884. if !strings.Contains(err.Error(), "connection refused") {
  885. return err
  886. }
  887. if runtime.GOOS == "darwin" {
  888. if err := startMacApp(client); err != nil {
  889. return fmt.Errorf("could not connect to ollama app, is it running?")
  890. }
  891. } else {
  892. return fmt.Errorf("could not connect to ollama server, run 'ollama serve' to start it")
  893. }
  894. }
  895. return nil
  896. }
  897. func NewCLI() *cobra.Command {
  898. log.SetFlags(log.LstdFlags | log.Lshortfile)
  899. rootCmd := &cobra.Command{
  900. Use: "ollama",
  901. Short: "Large language model runner",
  902. SilenceUsage: true,
  903. SilenceErrors: true,
  904. CompletionOptions: cobra.CompletionOptions{
  905. DisableDefaultCmd: true,
  906. },
  907. Version: version.Version,
  908. }
  909. cobra.EnableCommandSorting = false
  910. createCmd := &cobra.Command{
  911. Use: "create MODEL",
  912. Short: "Create a model from a Modelfile",
  913. Args: cobra.ExactArgs(1),
  914. PreRunE: checkServerHeartbeat,
  915. RunE: CreateHandler,
  916. }
  917. createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
  918. showCmd := &cobra.Command{
  919. Use: "show MODEL",
  920. Short: "Show information for a model",
  921. Args: cobra.ExactArgs(1),
  922. PreRunE: checkServerHeartbeat,
  923. RunE: ShowHandler,
  924. }
  925. showCmd.Flags().Bool("license", false, "Show license of a model")
  926. showCmd.Flags().Bool("modelfile", false, "Show Modelfile of a model")
  927. showCmd.Flags().Bool("parameters", false, "Show parameters of a model")
  928. showCmd.Flags().Bool("template", false, "Show template of a model")
  929. showCmd.Flags().Bool("system", false, "Show system prompt of a model")
  930. runCmd := &cobra.Command{
  931. Use: "run MODEL [PROMPT]",
  932. Short: "Run a model",
  933. Args: cobra.MinimumNArgs(1),
  934. PreRunE: checkServerHeartbeat,
  935. RunE: RunHandler,
  936. }
  937. runCmd.Flags().Bool("verbose", false, "Show timings for response")
  938. runCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  939. runCmd.Flags().Bool("nowordwrap", false, "Don't wrap words to the next line automatically")
  940. runCmd.Flags().String("format", "", "Response format (e.g. json)")
  941. serveCmd := &cobra.Command{
  942. Use: "serve",
  943. Aliases: []string{"start"},
  944. Short: "Start ollama",
  945. Args: cobra.ExactArgs(0),
  946. RunE: RunServer,
  947. }
  948. pullCmd := &cobra.Command{
  949. Use: "pull MODEL",
  950. Short: "Pull a model from a registry",
  951. Args: cobra.ExactArgs(1),
  952. PreRunE: checkServerHeartbeat,
  953. RunE: PullHandler,
  954. }
  955. pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  956. pushCmd := &cobra.Command{
  957. Use: "push MODEL",
  958. Short: "Push a model to a registry",
  959. Args: cobra.ExactArgs(1),
  960. PreRunE: checkServerHeartbeat,
  961. RunE: PushHandler,
  962. }
  963. pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
  964. listCmd := &cobra.Command{
  965. Use: "list",
  966. Aliases: []string{"ls"},
  967. Short: "List models",
  968. PreRunE: checkServerHeartbeat,
  969. RunE: ListHandler,
  970. }
  971. copyCmd := &cobra.Command{
  972. Use: "cp SOURCE TARGET",
  973. Short: "Copy a model",
  974. Args: cobra.ExactArgs(2),
  975. PreRunE: checkServerHeartbeat,
  976. RunE: CopyHandler,
  977. }
  978. deleteCmd := &cobra.Command{
  979. Use: "rm MODEL [MODEL...]",
  980. Short: "Remove a model",
  981. Args: cobra.MinimumNArgs(1),
  982. PreRunE: checkServerHeartbeat,
  983. RunE: DeleteHandler,
  984. }
  985. rootCmd.AddCommand(
  986. serveCmd,
  987. createCmd,
  988. showCmd,
  989. runCmd,
  990. pullCmd,
  991. pushCmd,
  992. listCmd,
  993. copyCmd,
  994. deleteCmd,
  995. )
  996. return rootCmd
  997. }