// routes_test.go

  1. package server
  2. import (
  3. "bytes"
  4. "context"
  5. "encoding/binary"
  6. "encoding/json"
  7. "fmt"
  8. "io"
  9. "math"
  10. "net/http"
  11. "net/http/httptest"
  12. "os"
  13. "sort"
  14. "strings"
  15. "testing"
  16. "github.com/stretchr/testify/assert"
  17. "github.com/stretchr/testify/require"
  18. "github.com/ollama/ollama/api"
  19. "github.com/ollama/ollama/envconfig"
  20. "github.com/ollama/ollama/llm"
  21. "github.com/ollama/ollama/openai"
  22. "github.com/ollama/ollama/parser"
  23. "github.com/ollama/ollama/types/model"
  24. "github.com/ollama/ollama/version"
  25. )
  26. func createTestFile(t *testing.T, name string) string {
  27. t.Helper()
  28. f, err := os.CreateTemp(t.TempDir(), name)
  29. require.NoError(t, err)
  30. defer f.Close()
  31. err = binary.Write(f, binary.LittleEndian, []byte("GGUF"))
  32. require.NoError(t, err)
  33. err = binary.Write(f, binary.LittleEndian, uint32(3))
  34. require.NoError(t, err)
  35. err = binary.Write(f, binary.LittleEndian, uint64(0))
  36. require.NoError(t, err)
  37. err = binary.Write(f, binary.LittleEndian, uint64(0))
  38. require.NoError(t, err)
  39. return f.Name()
  40. }
  41. func Test_Routes(t *testing.T) {
  42. type testCase struct {
  43. Name string
  44. Method string
  45. Path string
  46. Setup func(t *testing.T, req *http.Request)
  47. Expected func(t *testing.T, resp *http.Response)
  48. }
  49. createTestModel := func(t *testing.T, name string) {
  50. t.Helper()
  51. fname := createTestFile(t, "ollama-model")
  52. r := strings.NewReader(fmt.Sprintf("FROM %s\nPARAMETER seed 42\nPARAMETER top_p 0.9\nPARAMETER stop foo\nPARAMETER stop bar", fname))
  53. modelfile, err := parser.ParseFile(r)
  54. require.NoError(t, err)
  55. fn := func(resp api.ProgressResponse) {
  56. t.Logf("Status: %s", resp.Status)
  57. }
  58. err = CreateModel(context.TODO(), model.ParseName(name), "", "", modelfile, fn)
  59. require.NoError(t, err)
  60. }
  61. testCases := []testCase{
  62. {
  63. Name: "Version Handler",
  64. Method: http.MethodGet,
  65. Path: "/api/version",
  66. Setup: func(t *testing.T, req *http.Request) {
  67. },
  68. Expected: func(t *testing.T, resp *http.Response) {
  69. contentType := resp.Header.Get("Content-Type")
  70. assert.Equal(t, "application/json; charset=utf-8", contentType)
  71. body, err := io.ReadAll(resp.Body)
  72. require.NoError(t, err)
  73. assert.Equal(t, fmt.Sprintf(`{"version":"%s"}`, version.Version), string(body))
  74. },
  75. },
  76. {
  77. Name: "Tags Handler (no tags)",
  78. Method: http.MethodGet,
  79. Path: "/api/tags",
  80. Expected: func(t *testing.T, resp *http.Response) {
  81. contentType := resp.Header.Get("Content-Type")
  82. assert.Equal(t, "application/json; charset=utf-8", contentType)
  83. body, err := io.ReadAll(resp.Body)
  84. require.NoError(t, err)
  85. var modelList api.ListResponse
  86. err = json.Unmarshal(body, &modelList)
  87. require.NoError(t, err)
  88. assert.NotNil(t, modelList.Models)
  89. assert.Empty(t, len(modelList.Models))
  90. },
  91. },
  92. {
  93. Name: "openai empty list",
  94. Method: http.MethodGet,
  95. Path: "/v1/models",
  96. Expected: func(t *testing.T, resp *http.Response) {
  97. contentType := resp.Header.Get("Content-Type")
  98. assert.Equal(t, "application/json", contentType)
  99. body, err := io.ReadAll(resp.Body)
  100. require.NoError(t, err)
  101. var modelList openai.ListCompletion
  102. err = json.Unmarshal(body, &modelList)
  103. require.NoError(t, err)
  104. assert.Equal(t, "list", modelList.Object)
  105. assert.Empty(t, modelList.Data)
  106. },
  107. },
  108. {
  109. Name: "Tags Handler (yes tags)",
  110. Method: http.MethodGet,
  111. Path: "/api/tags",
  112. Setup: func(t *testing.T, req *http.Request) {
  113. createTestModel(t, "test-model")
  114. },
  115. Expected: func(t *testing.T, resp *http.Response) {
  116. contentType := resp.Header.Get("Content-Type")
  117. assert.Equal(t, "application/json; charset=utf-8", contentType)
  118. body, err := io.ReadAll(resp.Body)
  119. require.NoError(t, err)
  120. assert.NotContains(t, string(body), "expires_at")
  121. var modelList api.ListResponse
  122. err = json.Unmarshal(body, &modelList)
  123. require.NoError(t, err)
  124. assert.Len(t, modelList.Models, 1)
  125. assert.Equal(t, "test-model:latest", modelList.Models[0].Name)
  126. },
  127. },
  128. {
  129. Name: "openai list models with tags",
  130. Method: http.MethodGet,
  131. Path: "/v1/models",
  132. Expected: func(t *testing.T, resp *http.Response) {
  133. contentType := resp.Header.Get("Content-Type")
  134. assert.Equal(t, "application/json", contentType)
  135. body, err := io.ReadAll(resp.Body)
  136. require.NoError(t, err)
  137. var modelList openai.ListCompletion
  138. err = json.Unmarshal(body, &modelList)
  139. require.NoError(t, err)
  140. assert.Len(t, modelList.Data, 1)
  141. assert.Equal(t, "test-model:latest", modelList.Data[0].Id)
  142. assert.Equal(t, "library", modelList.Data[0].OwnedBy)
  143. },
  144. },
  145. {
  146. Name: "Create Model Handler",
  147. Method: http.MethodPost,
  148. Path: "/api/create",
  149. Setup: func(t *testing.T, req *http.Request) {
  150. fname := createTestFile(t, "ollama-model")
  151. stream := false
  152. createReq := api.CreateRequest{
  153. Name: "t-bone",
  154. Modelfile: fmt.Sprintf("FROM %s", fname),
  155. Stream: &stream,
  156. }
  157. jsonData, err := json.Marshal(createReq)
  158. require.NoError(t, err)
  159. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  160. },
  161. Expected: func(t *testing.T, resp *http.Response) {
  162. contentType := resp.Header.Get("Content-Type")
  163. assert.Equal(t, "application/json", contentType)
  164. _, err := io.ReadAll(resp.Body)
  165. require.NoError(t, err)
  166. assert.Equal(t, 200, resp.StatusCode)
  167. model, err := GetModel("t-bone")
  168. require.NoError(t, err)
  169. assert.Equal(t, "t-bone:latest", model.ShortName)
  170. },
  171. },
  172. {
  173. Name: "Copy Model Handler",
  174. Method: http.MethodPost,
  175. Path: "/api/copy",
  176. Setup: func(t *testing.T, req *http.Request) {
  177. createTestModel(t, "hamshank")
  178. copyReq := api.CopyRequest{
  179. Source: "hamshank",
  180. Destination: "beefsteak",
  181. }
  182. jsonData, err := json.Marshal(copyReq)
  183. require.NoError(t, err)
  184. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  185. },
  186. Expected: func(t *testing.T, resp *http.Response) {
  187. model, err := GetModel("beefsteak")
  188. require.NoError(t, err)
  189. assert.Equal(t, "beefsteak:latest", model.ShortName)
  190. },
  191. },
  192. {
  193. Name: "Show Model Handler",
  194. Method: http.MethodPost,
  195. Path: "/api/show",
  196. Setup: func(t *testing.T, req *http.Request) {
  197. createTestModel(t, "show-model")
  198. showReq := api.ShowRequest{Model: "show-model"}
  199. jsonData, err := json.Marshal(showReq)
  200. require.NoError(t, err)
  201. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  202. },
  203. Expected: func(t *testing.T, resp *http.Response) {
  204. contentType := resp.Header.Get("Content-Type")
  205. assert.Equal(t, "application/json; charset=utf-8", contentType)
  206. body, err := io.ReadAll(resp.Body)
  207. require.NoError(t, err)
  208. var showResp api.ShowResponse
  209. err = json.Unmarshal(body, &showResp)
  210. require.NoError(t, err)
  211. var params []string
  212. paramsSplit := strings.Split(showResp.Parameters, "\n")
  213. for _, p := range paramsSplit {
  214. params = append(params, strings.Join(strings.Fields(p), " "))
  215. }
  216. sort.Strings(params)
  217. expectedParams := []string{
  218. "seed 42",
  219. "stop \"bar\"",
  220. "stop \"foo\"",
  221. "top_p 0.9",
  222. }
  223. assert.Equal(t, expectedParams, params)
  224. assert.InDelta(t, 0, showResp.ModelInfo["general.parameter_count"], 1e-9, "Parameter count should be 0")
  225. },
  226. },
  227. {
  228. Name: "openai retrieve model handler",
  229. Method: http.MethodGet,
  230. Path: "/v1/models/show-model",
  231. Expected: func(t *testing.T, resp *http.Response) {
  232. contentType := resp.Header.Get("Content-Type")
  233. assert.Equal(t, "application/json", contentType)
  234. body, err := io.ReadAll(resp.Body)
  235. require.NoError(t, err)
  236. var retrieveResp api.RetrieveModelResponse
  237. err = json.Unmarshal(body, &retrieveResp)
  238. require.NoError(t, err)
  239. assert.Equal(t, "show-model", retrieveResp.Id)
  240. assert.Equal(t, "library", retrieveResp.OwnedBy)
  241. },
  242. },
  243. {
  244. Name: "Embed Handler Empty Input",
  245. Method: http.MethodPost,
  246. Path: "/api/embed",
  247. Setup: func(t *testing.T, req *http.Request) {
  248. embedReq := api.EmbedRequest{
  249. Model: "t-bone",
  250. Input: "",
  251. }
  252. jsonData, err := json.Marshal(embedReq)
  253. require.NoError(t, err)
  254. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  255. },
  256. Expected: func(t *testing.T, resp *http.Response) {
  257. contentType := resp.Header.Get("Content-Type")
  258. if contentType != "application/json; charset=utf-8" {
  259. t.Fatalf("expected content type application/json; charset=utf-8, got %s", contentType)
  260. }
  261. body, err := io.ReadAll(resp.Body)
  262. if err != nil {
  263. t.Fatal(err)
  264. }
  265. var embedResp api.EmbedResponse
  266. err = json.Unmarshal(body, &embedResp)
  267. if err != nil {
  268. t.Fatal(err)
  269. }
  270. if embedResp.Model != "t-bone" {
  271. t.Fatalf("expected model t-bone, got %s", embedResp.Model)
  272. }
  273. if embedResp.Embeddings == nil {
  274. t.Fatalf("expected embeddings to not be nil, got %v", embedResp.Embeddings)
  275. }
  276. if len(embedResp.Embeddings) != 0 {
  277. t.Fatalf("expected embeddings to be empty, got %v", embedResp.Embeddings)
  278. }
  279. },
  280. },
  281. {
  282. Name: "Embed Handler Invalid Input",
  283. Method: http.MethodPost,
  284. Path: "/api/embed",
  285. Setup: func(t *testing.T, req *http.Request) {
  286. embedReq := api.EmbedRequest{
  287. Model: "t-bone",
  288. Input: 2,
  289. }
  290. jsonData, err := json.Marshal(embedReq)
  291. require.NoError(t, err)
  292. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  293. },
  294. Expected: func(t *testing.T, resp *http.Response) {
  295. contentType := resp.Header.Get("Content-Type")
  296. if contentType != "application/json; charset=utf-8" {
  297. t.Fatalf("expected content type application/json; charset=utf-8, got %s", contentType)
  298. }
  299. _, err := io.ReadAll(resp.Body)
  300. if err != nil {
  301. t.Fatal(err)
  302. }
  303. if resp.StatusCode != http.StatusBadRequest {
  304. t.Fatalf("expected status code 400, got %d", resp.StatusCode)
  305. }
  306. },
  307. },
  308. }
  309. t.Setenv("OLLAMA_MODELS", t.TempDir())
  310. envconfig.LoadConfig()
  311. s := &Server{}
  312. router := s.GenerateRoutes()
  313. httpSrv := httptest.NewServer(router)
  314. t.Cleanup(httpSrv.Close)
  315. for _, tc := range testCases {
  316. t.Run(tc.Name, func(t *testing.T) {
  317. u := httpSrv.URL + tc.Path
  318. req, err := http.NewRequestWithContext(context.TODO(), tc.Method, u, nil)
  319. require.NoError(t, err)
  320. if tc.Setup != nil {
  321. tc.Setup(t, req)
  322. }
  323. resp, err := httpSrv.Client().Do(req)
  324. require.NoError(t, err)
  325. defer resp.Body.Close()
  326. if tc.Expected != nil {
  327. tc.Expected(t, resp)
  328. }
  329. })
  330. }
  331. }
  332. func TestCase(t *testing.T) {
  333. t.Setenv("OLLAMA_MODELS", t.TempDir())
  334. envconfig.LoadConfig()
  335. cases := []string{
  336. "mistral",
  337. "llama3:latest",
  338. "library/phi3:q4_0",
  339. "registry.ollama.ai/library/gemma:q5_K_M",
  340. // TODO: host:port currently fails on windows (#4107)
  341. // "localhost:5000/alice/bob:latest",
  342. }
  343. var s Server
  344. for _, tt := range cases {
  345. t.Run(tt, func(t *testing.T) {
  346. w := createRequest(t, s.CreateModelHandler, api.CreateRequest{
  347. Name: tt,
  348. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  349. Stream: &stream,
  350. })
  351. if w.Code != http.StatusOK {
  352. t.Fatalf("expected status 200 got %d", w.Code)
  353. }
  354. expect, err := json.Marshal(map[string]string{"error": "a model with that name already exists"})
  355. if err != nil {
  356. t.Fatal(err)
  357. }
  358. t.Run("create", func(t *testing.T) {
  359. w = createRequest(t, s.CreateModelHandler, api.CreateRequest{
  360. Name: strings.ToUpper(tt),
  361. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  362. Stream: &stream,
  363. })
  364. if w.Code != http.StatusBadRequest {
  365. t.Fatalf("expected status 500 got %d", w.Code)
  366. }
  367. if !bytes.Equal(w.Body.Bytes(), expect) {
  368. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  369. }
  370. })
  371. t.Run("pull", func(t *testing.T) {
  372. w := createRequest(t, s.PullModelHandler, api.PullRequest{
  373. Name: strings.ToUpper(tt),
  374. Stream: &stream,
  375. })
  376. if w.Code != http.StatusBadRequest {
  377. t.Fatalf("expected status 500 got %d", w.Code)
  378. }
  379. if !bytes.Equal(w.Body.Bytes(), expect) {
  380. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  381. }
  382. })
  383. t.Run("copy", func(t *testing.T) {
  384. w := createRequest(t, s.CopyModelHandler, api.CopyRequest{
  385. Source: tt,
  386. Destination: strings.ToUpper(tt),
  387. })
  388. if w.Code != http.StatusBadRequest {
  389. t.Fatalf("expected status 500 got %d", w.Code)
  390. }
  391. if !bytes.Equal(w.Body.Bytes(), expect) {
  392. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  393. }
  394. })
  395. })
  396. }
  397. }
  398. func TestShow(t *testing.T) {
  399. t.Setenv("OLLAMA_MODELS", t.TempDir())
  400. envconfig.LoadConfig()
  401. var s Server
  402. createRequest(t, s.CreateModelHandler, api.CreateRequest{
  403. Name: "show-model",
  404. Modelfile: fmt.Sprintf(
  405. "FROM %s\nFROM %s",
  406. createBinFile(t, llm.KV{"general.architecture": "test"}, nil),
  407. createBinFile(t, llm.KV{"general.architecture": "clip"}, nil),
  408. ),
  409. })
  410. w := createRequest(t, s.ShowModelHandler, api.ShowRequest{
  411. Name: "show-model",
  412. })
  413. if w.Code != http.StatusOK {
  414. t.Fatalf("expected status code 200, actual %d", w.Code)
  415. }
  416. var resp api.ShowResponse
  417. if err := json.NewDecoder(w.Body).Decode(&resp); err != nil {
  418. t.Fatal(err)
  419. }
  420. if resp.ModelInfo["general.architecture"] != "test" {
  421. t.Fatal("Expected model architecture to be 'test', but got", resp.ModelInfo["general.architecture"])
  422. }
  423. if resp.ProjectorInfo["general.architecture"] != "clip" {
  424. t.Fatal("Expected projector architecture to be 'clip', but got", resp.ProjectorInfo["general.architecture"])
  425. }
  426. }
  427. func TestNormalize(t *testing.T) {
  428. type testCase struct {
  429. input []float32
  430. }
  431. testCases := []testCase{
  432. {input: []float32{1}},
  433. {input: []float32{0, 1, 2, 3}},
  434. {input: []float32{0.1, 0.2, 0.3}},
  435. {input: []float32{-0.1, 0.2, 0.3, -0.4}},
  436. {input: []float32{0, 0, 0}},
  437. }
  438. isNormalized := func(vec []float32) (res bool) {
  439. sum := 0.0
  440. for _, v := range vec {
  441. sum += float64(v * v)
  442. }
  443. if math.Abs(sum-1) > 1e-6 {
  444. return sum == 0
  445. } else {
  446. return true
  447. }
  448. }
  449. for _, tc := range testCases {
  450. t.Run("", func(t *testing.T) {
  451. normalized := normalize(tc.input)
  452. if !isNormalized(normalized) {
  453. t.Errorf("Vector %v is not normalized", tc.input)
  454. }
  455. })
  456. }
  457. }