routes_test.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591
  1. package server
  2. import (
  3. "bytes"
  4. "context"
  5. "encoding/binary"
  6. "encoding/json"
  7. "fmt"
  8. "io"
  9. "math"
  10. "net/http"
  11. "net/http/httptest"
  12. "net/url"
  13. "os"
  14. "sort"
  15. "strings"
  16. "testing"
  17. "github.com/gin-gonic/gin"
  18. "github.com/stretchr/testify/assert"
  19. "github.com/stretchr/testify/require"
  20. "github.com/ollama/ollama/api"
  21. "github.com/ollama/ollama/auth"
  22. "github.com/ollama/ollama/envconfig"
  23. "github.com/ollama/ollama/llm"
  24. "github.com/ollama/ollama/openai"
  25. "github.com/ollama/ollama/parser"
  26. "github.com/ollama/ollama/types/model"
  27. "github.com/ollama/ollama/version"
  28. )
  29. func createTestFile(t *testing.T, name string) string {
  30. t.Helper()
  31. f, err := os.CreateTemp(t.TempDir(), name)
  32. require.NoError(t, err)
  33. defer f.Close()
  34. err = binary.Write(f, binary.LittleEndian, []byte("GGUF"))
  35. require.NoError(t, err)
  36. err = binary.Write(f, binary.LittleEndian, uint32(3))
  37. require.NoError(t, err)
  38. err = binary.Write(f, binary.LittleEndian, uint64(0))
  39. require.NoError(t, err)
  40. err = binary.Write(f, binary.LittleEndian, uint64(0))
  41. require.NoError(t, err)
  42. return f.Name()
  43. }
  44. func Test_Routes(t *testing.T) {
  45. type testCase struct {
  46. Name string
  47. Method string
  48. Path string
  49. Setup func(t *testing.T, req *http.Request)
  50. Expected func(t *testing.T, resp *http.Response)
  51. }
  52. createTestModel := func(t *testing.T, name string) {
  53. t.Helper()
  54. fname := createTestFile(t, "ollama-model")
  55. r := strings.NewReader(fmt.Sprintf("FROM %s\nPARAMETER seed 42\nPARAMETER top_p 0.9\nPARAMETER stop foo\nPARAMETER stop bar", fname))
  56. modelfile, err := parser.ParseFile(r)
  57. require.NoError(t, err)
  58. fn := func(resp api.ProgressResponse) {
  59. t.Logf("Status: %s", resp.Status)
  60. }
  61. err = CreateModel(context.TODO(), model.ParseName(name), "", "", modelfile, fn)
  62. require.NoError(t, err)
  63. }
  64. testCases := []testCase{
  65. {
  66. Name: "Version Handler",
  67. Method: http.MethodGet,
  68. Path: "/api/version",
  69. Setup: func(t *testing.T, req *http.Request) {
  70. },
  71. Expected: func(t *testing.T, resp *http.Response) {
  72. contentType := resp.Header.Get("Content-Type")
  73. assert.Equal(t, "application/json; charset=utf-8", contentType)
  74. body, err := io.ReadAll(resp.Body)
  75. require.NoError(t, err)
  76. assert.Equal(t, fmt.Sprintf(`{"version":"%s"}`, version.Version), string(body))
  77. },
  78. },
  79. {
  80. Name: "Tags Handler (no tags)",
  81. Method: http.MethodGet,
  82. Path: "/api/tags",
  83. Expected: func(t *testing.T, resp *http.Response) {
  84. contentType := resp.Header.Get("Content-Type")
  85. assert.Equal(t, "application/json; charset=utf-8", contentType)
  86. body, err := io.ReadAll(resp.Body)
  87. require.NoError(t, err)
  88. var modelList api.ListResponse
  89. err = json.Unmarshal(body, &modelList)
  90. require.NoError(t, err)
  91. assert.NotNil(t, modelList.Models)
  92. assert.Empty(t, len(modelList.Models))
  93. },
  94. },
  95. {
  96. Name: "openai empty list",
  97. Method: http.MethodGet,
  98. Path: "/v1/models",
  99. Expected: func(t *testing.T, resp *http.Response) {
  100. contentType := resp.Header.Get("Content-Type")
  101. assert.Equal(t, "application/json", contentType)
  102. body, err := io.ReadAll(resp.Body)
  103. require.NoError(t, err)
  104. var modelList openai.ListCompletion
  105. err = json.Unmarshal(body, &modelList)
  106. require.NoError(t, err)
  107. assert.Equal(t, "list", modelList.Object)
  108. assert.Empty(t, modelList.Data)
  109. },
  110. },
  111. {
  112. Name: "Tags Handler (yes tags)",
  113. Method: http.MethodGet,
  114. Path: "/api/tags",
  115. Setup: func(t *testing.T, req *http.Request) {
  116. createTestModel(t, "test-model")
  117. },
  118. Expected: func(t *testing.T, resp *http.Response) {
  119. contentType := resp.Header.Get("Content-Type")
  120. assert.Equal(t, "application/json; charset=utf-8", contentType)
  121. body, err := io.ReadAll(resp.Body)
  122. require.NoError(t, err)
  123. assert.NotContains(t, string(body), "expires_at")
  124. var modelList api.ListResponse
  125. err = json.Unmarshal(body, &modelList)
  126. require.NoError(t, err)
  127. assert.Len(t, modelList.Models, 1)
  128. assert.Equal(t, "test-model:latest", modelList.Models[0].Name)
  129. },
  130. },
  131. {
  132. Name: "openai list models with tags",
  133. Method: http.MethodGet,
  134. Path: "/v1/models",
  135. Expected: func(t *testing.T, resp *http.Response) {
  136. contentType := resp.Header.Get("Content-Type")
  137. assert.Equal(t, "application/json", contentType)
  138. body, err := io.ReadAll(resp.Body)
  139. require.NoError(t, err)
  140. var modelList openai.ListCompletion
  141. err = json.Unmarshal(body, &modelList)
  142. require.NoError(t, err)
  143. assert.Len(t, modelList.Data, 1)
  144. assert.Equal(t, "test-model:latest", modelList.Data[0].Id)
  145. assert.Equal(t, "library", modelList.Data[0].OwnedBy)
  146. },
  147. },
  148. {
  149. Name: "Create Model Handler",
  150. Method: http.MethodPost,
  151. Path: "/api/create",
  152. Setup: func(t *testing.T, req *http.Request) {
  153. fname := createTestFile(t, "ollama-model")
  154. stream := false
  155. createReq := api.CreateRequest{
  156. Name: "t-bone",
  157. Modelfile: fmt.Sprintf("FROM %s", fname),
  158. Stream: &stream,
  159. }
  160. jsonData, err := json.Marshal(createReq)
  161. require.NoError(t, err)
  162. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  163. },
  164. Expected: func(t *testing.T, resp *http.Response) {
  165. contentType := resp.Header.Get("Content-Type")
  166. assert.Equal(t, "application/json", contentType)
  167. _, err := io.ReadAll(resp.Body)
  168. require.NoError(t, err)
  169. assert.Equal(t, 200, resp.StatusCode)
  170. model, err := GetModel("t-bone")
  171. require.NoError(t, err)
  172. assert.Equal(t, "t-bone:latest", model.ShortName)
  173. },
  174. },
  175. {
  176. Name: "Copy Model Handler",
  177. Method: http.MethodPost,
  178. Path: "/api/copy",
  179. Setup: func(t *testing.T, req *http.Request) {
  180. createTestModel(t, "hamshank")
  181. copyReq := api.CopyRequest{
  182. Source: "hamshank",
  183. Destination: "beefsteak",
  184. }
  185. jsonData, err := json.Marshal(copyReq)
  186. require.NoError(t, err)
  187. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  188. },
  189. Expected: func(t *testing.T, resp *http.Response) {
  190. model, err := GetModel("beefsteak")
  191. require.NoError(t, err)
  192. assert.Equal(t, "beefsteak:latest", model.ShortName)
  193. },
  194. },
  195. {
  196. Name: "Show Model Handler",
  197. Method: http.MethodPost,
  198. Path: "/api/show",
  199. Setup: func(t *testing.T, req *http.Request) {
  200. createTestModel(t, "show-model")
  201. showReq := api.ShowRequest{Model: "show-model"}
  202. jsonData, err := json.Marshal(showReq)
  203. require.NoError(t, err)
  204. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  205. },
  206. Expected: func(t *testing.T, resp *http.Response) {
  207. contentType := resp.Header.Get("Content-Type")
  208. assert.Equal(t, "application/json; charset=utf-8", contentType)
  209. body, err := io.ReadAll(resp.Body)
  210. require.NoError(t, err)
  211. var showResp api.ShowResponse
  212. err = json.Unmarshal(body, &showResp)
  213. require.NoError(t, err)
  214. var params []string
  215. paramsSplit := strings.Split(showResp.Parameters, "\n")
  216. for _, p := range paramsSplit {
  217. params = append(params, strings.Join(strings.Fields(p), " "))
  218. }
  219. sort.Strings(params)
  220. expectedParams := []string{
  221. "seed 42",
  222. "stop \"bar\"",
  223. "stop \"foo\"",
  224. "top_p 0.9",
  225. }
  226. assert.Equal(t, expectedParams, params)
  227. assert.InDelta(t, 0, showResp.ModelInfo["general.parameter_count"], 1e-9, "Parameter count should be 0")
  228. },
  229. },
  230. {
  231. Name: "openai retrieve model handler",
  232. Method: http.MethodGet,
  233. Path: "/v1/models/show-model",
  234. Expected: func(t *testing.T, resp *http.Response) {
  235. contentType := resp.Header.Get("Content-Type")
  236. assert.Equal(t, "application/json", contentType)
  237. body, err := io.ReadAll(resp.Body)
  238. require.NoError(t, err)
  239. var retrieveResp api.RetrieveModelResponse
  240. err = json.Unmarshal(body, &retrieveResp)
  241. require.NoError(t, err)
  242. assert.Equal(t, "show-model", retrieveResp.Id)
  243. assert.Equal(t, "library", retrieveResp.OwnedBy)
  244. },
  245. },
  246. {
  247. Name: "Embed Handler Empty Input",
  248. Method: http.MethodPost,
  249. Path: "/api/embed",
  250. Setup: func(t *testing.T, req *http.Request) {
  251. embedReq := api.EmbedRequest{
  252. Model: "t-bone",
  253. Input: "",
  254. }
  255. jsonData, err := json.Marshal(embedReq)
  256. require.NoError(t, err)
  257. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  258. },
  259. Expected: func(t *testing.T, resp *http.Response) {
  260. contentType := resp.Header.Get("Content-Type")
  261. if contentType != "application/json; charset=utf-8" {
  262. t.Fatalf("expected content type application/json; charset=utf-8, got %s", contentType)
  263. }
  264. body, err := io.ReadAll(resp.Body)
  265. if err != nil {
  266. t.Fatal(err)
  267. }
  268. var embedResp api.EmbedResponse
  269. err = json.Unmarshal(body, &embedResp)
  270. if err != nil {
  271. t.Fatal(err)
  272. }
  273. if embedResp.Model != "t-bone" {
  274. t.Fatalf("expected model t-bone, got %s", embedResp.Model)
  275. }
  276. if embedResp.Embeddings == nil {
  277. t.Fatalf("expected embeddings to not be nil, got %v", embedResp.Embeddings)
  278. }
  279. if len(embedResp.Embeddings) != 0 {
  280. t.Fatalf("expected embeddings to be empty, got %v", embedResp.Embeddings)
  281. }
  282. },
  283. },
  284. {
  285. Name: "Embed Handler Invalid Input",
  286. Method: http.MethodPost,
  287. Path: "/api/embed",
  288. Setup: func(t *testing.T, req *http.Request) {
  289. embedReq := api.EmbedRequest{
  290. Model: "t-bone",
  291. Input: 2,
  292. }
  293. jsonData, err := json.Marshal(embedReq)
  294. require.NoError(t, err)
  295. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  296. },
  297. Expected: func(t *testing.T, resp *http.Response) {
  298. contentType := resp.Header.Get("Content-Type")
  299. if contentType != "application/json; charset=utf-8" {
  300. t.Fatalf("expected content type application/json; charset=utf-8, got %s", contentType)
  301. }
  302. _, err := io.ReadAll(resp.Body)
  303. if err != nil {
  304. t.Fatal(err)
  305. }
  306. if resp.StatusCode != http.StatusBadRequest {
  307. t.Fatalf("expected status code 400, got %d", resp.StatusCode)
  308. }
  309. },
  310. },
  311. }
  312. t.Setenv("OLLAMA_MODELS", t.TempDir())
  313. envconfig.LoadConfig()
  314. s := &Server{}
  315. router := s.GenerateRoutes()
  316. httpSrv := httptest.NewServer(router)
  317. t.Cleanup(httpSrv.Close)
  318. for _, tc := range testCases {
  319. t.Run(tc.Name, func(t *testing.T) {
  320. u := httpSrv.URL + tc.Path
  321. req, err := http.NewRequestWithContext(context.TODO(), tc.Method, u, nil)
  322. require.NoError(t, err)
  323. if tc.Setup != nil {
  324. tc.Setup(t, req)
  325. }
  326. resp, err := httpSrv.Client().Do(req)
  327. require.NoError(t, err)
  328. defer resp.Body.Close()
  329. if tc.Expected != nil {
  330. tc.Expected(t, resp)
  331. }
  332. })
  333. }
  334. }
  335. func TestCase(t *testing.T) {
  336. t.Setenv("OLLAMA_MODELS", t.TempDir())
  337. envconfig.LoadConfig()
  338. cases := []string{
  339. "mistral",
  340. "llama3:latest",
  341. "library/phi3:q4_0",
  342. "registry.ollama.ai/library/gemma:q5_K_M",
  343. // TODO: host:port currently fails on windows (#4107)
  344. // "localhost:5000/alice/bob:latest",
  345. }
  346. var s Server
  347. for _, tt := range cases {
  348. t.Run(tt, func(t *testing.T) {
  349. w := createRequest(t, s.CreateModelHandler, api.CreateRequest{
  350. Name: tt,
  351. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  352. Stream: &stream,
  353. })
  354. if w.Code != http.StatusOK {
  355. t.Fatalf("expected status 200 got %d", w.Code)
  356. }
  357. expect, err := json.Marshal(map[string]string{"error": "a model with that name already exists"})
  358. if err != nil {
  359. t.Fatal(err)
  360. }
  361. t.Run("create", func(t *testing.T) {
  362. w = createRequest(t, s.CreateModelHandler, api.CreateRequest{
  363. Name: strings.ToUpper(tt),
  364. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  365. Stream: &stream,
  366. })
  367. if w.Code != http.StatusBadRequest {
  368. t.Fatalf("expected status 500 got %d", w.Code)
  369. }
  370. if !bytes.Equal(w.Body.Bytes(), expect) {
  371. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  372. }
  373. })
  374. t.Run("pull", func(t *testing.T) {
  375. w := createRequest(t, s.PullModelHandler, api.PullRequest{
  376. Name: strings.ToUpper(tt),
  377. Stream: &stream,
  378. })
  379. if w.Code != http.StatusBadRequest {
  380. t.Fatalf("expected status 500 got %d", w.Code)
  381. }
  382. if !bytes.Equal(w.Body.Bytes(), expect) {
  383. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  384. }
  385. })
  386. t.Run("copy", func(t *testing.T) {
  387. w := createRequest(t, s.CopyModelHandler, api.CopyRequest{
  388. Source: tt,
  389. Destination: strings.ToUpper(tt),
  390. })
  391. if w.Code != http.StatusBadRequest {
  392. t.Fatalf("expected status 500 got %d", w.Code)
  393. }
  394. if !bytes.Equal(w.Body.Bytes(), expect) {
  395. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  396. }
  397. })
  398. })
  399. }
  400. }
  401. func TestShow(t *testing.T) {
  402. t.Setenv("OLLAMA_MODELS", t.TempDir())
  403. envconfig.LoadConfig()
  404. var s Server
  405. createRequest(t, s.CreateModelHandler, api.CreateRequest{
  406. Name: "show-model",
  407. Modelfile: fmt.Sprintf(
  408. "FROM %s\nFROM %s",
  409. createBinFile(t, llm.KV{"general.architecture": "test"}, nil),
  410. createBinFile(t, llm.KV{"general.architecture": "clip"}, nil),
  411. ),
  412. })
  413. w := createRequest(t, s.ShowModelHandler, api.ShowRequest{
  414. Name: "show-model",
  415. })
  416. if w.Code != http.StatusOK {
  417. t.Fatalf("expected status code 200, actual %d", w.Code)
  418. }
  419. var resp api.ShowResponse
  420. if err := json.NewDecoder(w.Body).Decode(&resp); err != nil {
  421. t.Fatal(err)
  422. }
  423. if resp.ModelInfo["general.architecture"] != "test" {
  424. t.Fatal("Expected model architecture to be 'test', but got", resp.ModelInfo["general.architecture"])
  425. }
  426. if resp.ProjectorInfo["general.architecture"] != "clip" {
  427. t.Fatal("Expected projector architecture to be 'clip', but got", resp.ProjectorInfo["general.architecture"])
  428. }
  429. }
  430. func TestNormalize(t *testing.T) {
  431. type testCase struct {
  432. input []float32
  433. }
  434. testCases := []testCase{
  435. {input: []float32{1}},
  436. {input: []float32{0, 1, 2, 3}},
  437. {input: []float32{0.1, 0.2, 0.3}},
  438. {input: []float32{-0.1, 0.2, 0.3, -0.4}},
  439. {input: []float32{0, 0, 0}},
  440. }
  441. isNormalized := func(vec []float32) (res bool) {
  442. sum := 0.0
  443. for _, v := range vec {
  444. sum += float64(v * v)
  445. }
  446. if math.Abs(sum-1) > 1e-6 {
  447. return sum == 0
  448. } else {
  449. return true
  450. }
  451. }
  452. for _, tc := range testCases {
  453. t.Run("", func(t *testing.T) {
  454. normalized := normalize(tc.input)
  455. if !isNormalized(normalized) {
  456. t.Errorf("Vector %v is not normalized", tc.input)
  457. }
  458. })
  459. }
  460. }
  461. func TestIsLocalReal(t *testing.T) {
  462. gin.SetMode(gin.TestMode)
  463. clientPubLoc := t.TempDir()
  464. t.Setenv("HOME", clientPubLoc)
  465. _, err := auth.GetPublicKey()
  466. if err != nil {
  467. t.Fatal(err)
  468. }
  469. w := httptest.NewRecorder()
  470. ctx, _ := gin.CreateTestContext(w)
  471. ctx.Request = &http.Request{
  472. Header: make(http.Header),
  473. }
  474. requestURL := url.URL{
  475. Scheme: "http",
  476. Host: "localhost:8080",
  477. Path: "/api/blobs",
  478. }
  479. request := &http.Request{
  480. Method: http.MethodPost,
  481. URL: &requestURL,
  482. }
  483. s := &Server{}
  484. authz, err := api.Authorization(ctx, request)
  485. if err != nil {
  486. t.Fatal(err)
  487. }
  488. // Set client authorization header
  489. ctx.Request.Header.Set("Authorization", authz)
  490. if !s.isLocal(ctx) {
  491. t.Fatal("Expected isLocal to return true")
  492. }
  493. t.Run("different server pubkey", func(t *testing.T) {
  494. serverPubLoc := t.TempDir()
  495. t.Setenv("HOME", serverPubLoc)
  496. _, err := auth.GetPublicKey()
  497. if err != nil {
  498. t.Fatal(err)
  499. }
  500. if s.isLocal(ctx) {
  501. t.Fatal("Expected isLocal to return false")
  502. }
  503. })
  504. t.Run("invalid pubkey", func(t *testing.T) {
  505. ctx.Request.Header.Set("Authorization", "sha-25616:invalid")
  506. if s.isLocal(ctx) {
  507. t.Fatal("Expected isLocal to return false")
  508. }
  509. })
  510. }