routes_test.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506
  1. package server
  2. import (
  3. "bytes"
  4. "context"
  5. "encoding/binary"
  6. "encoding/json"
  7. "fmt"
  8. "io"
  9. "math"
  10. "net/http"
  11. "net/http/httptest"
  12. "os"
  13. "sort"
  14. "strings"
  15. "testing"
  16. "github.com/stretchr/testify/assert"
  17. "github.com/stretchr/testify/require"
  18. "github.com/ollama/ollama/api"
  19. "github.com/ollama/ollama/envconfig"
  20. "github.com/ollama/ollama/llm"
  21. "github.com/ollama/ollama/openai"
  22. "github.com/ollama/ollama/parser"
  23. "github.com/ollama/ollama/types/model"
  24. "github.com/ollama/ollama/version"
  25. )
  26. func createTestFile(t *testing.T, name string) string {
  27. t.Helper()
  28. f, err := os.CreateTemp(t.TempDir(), name)
  29. require.NoError(t, err)
  30. defer f.Close()
  31. err = binary.Write(f, binary.LittleEndian, []byte("GGUF"))
  32. require.NoError(t, err)
  33. err = binary.Write(f, binary.LittleEndian, uint32(3))
  34. require.NoError(t, err)
  35. err = binary.Write(f, binary.LittleEndian, uint64(0))
  36. require.NoError(t, err)
  37. err = binary.Write(f, binary.LittleEndian, uint64(0))
  38. require.NoError(t, err)
  39. return f.Name()
  40. }
  41. func Test_Routes(t *testing.T) {
  42. type testCase struct {
  43. Name string
  44. Method string
  45. Path string
  46. Setup func(t *testing.T, req *http.Request)
  47. Expected func(t *testing.T, resp *http.Response)
  48. }
  49. createTestModel := func(t *testing.T, name string) {
  50. t.Helper()
  51. fname := createTestFile(t, "ollama-model")
  52. r := strings.NewReader(fmt.Sprintf("FROM %s\nPARAMETER seed 42\nPARAMETER top_p 0.9\nPARAMETER stop foo\nPARAMETER stop bar", fname))
  53. modelfile, err := parser.ParseFile(r)
  54. require.NoError(t, err)
  55. fn := func(resp api.ProgressResponse) {
  56. t.Logf("Status: %s", resp.Status)
  57. }
  58. err = CreateModel(context.TODO(), model.ParseName(name), "", "", modelfile, fn)
  59. require.NoError(t, err)
  60. }
  61. testCases := []testCase{
  62. {
  63. Name: "Version Handler",
  64. Method: http.MethodGet,
  65. Path: "/api/version",
  66. Setup: func(t *testing.T, req *http.Request) {
  67. },
  68. Expected: func(t *testing.T, resp *http.Response) {
  69. contentType := resp.Header.Get("Content-Type")
  70. assert.Equal(t, "application/json; charset=utf-8", contentType)
  71. body, err := io.ReadAll(resp.Body)
  72. require.NoError(t, err)
  73. assert.Equal(t, fmt.Sprintf(`{"version":"%s"}`, version.Version), string(body))
  74. },
  75. },
  76. {
  77. Name: "Tags Handler (no tags)",
  78. Method: http.MethodGet,
  79. Path: "/api/tags",
  80. Expected: func(t *testing.T, resp *http.Response) {
  81. contentType := resp.Header.Get("Content-Type")
  82. assert.Equal(t, "application/json; charset=utf-8", contentType)
  83. body, err := io.ReadAll(resp.Body)
  84. require.NoError(t, err)
  85. var modelList api.ListResponse
  86. err = json.Unmarshal(body, &modelList)
  87. require.NoError(t, err)
  88. assert.NotNil(t, modelList.Models)
  89. assert.Empty(t, len(modelList.Models))
  90. },
  91. },
  92. {
  93. Name: "openai empty list",
  94. Method: http.MethodGet,
  95. Path: "/v1/models",
  96. Expected: func(t *testing.T, resp *http.Response) {
  97. contentType := resp.Header.Get("Content-Type")
  98. assert.Equal(t, "application/json", contentType)
  99. body, err := io.ReadAll(resp.Body)
  100. require.NoError(t, err)
  101. var modelList openai.ListCompletion
  102. err = json.Unmarshal(body, &modelList)
  103. require.NoError(t, err)
  104. assert.Equal(t, "list", modelList.Object)
  105. assert.Empty(t, modelList.Data)
  106. },
  107. },
  108. {
  109. Name: "Tags Handler (yes tags)",
  110. Method: http.MethodGet,
  111. Path: "/api/tags",
  112. Setup: func(t *testing.T, req *http.Request) {
  113. createTestModel(t, "test-model")
  114. },
  115. Expected: func(t *testing.T, resp *http.Response) {
  116. contentType := resp.Header.Get("Content-Type")
  117. assert.Equal(t, "application/json; charset=utf-8", contentType)
  118. body, err := io.ReadAll(resp.Body)
  119. require.NoError(t, err)
  120. assert.NotContains(t, string(body), "expires_at")
  121. var modelList api.ListResponse
  122. err = json.Unmarshal(body, &modelList)
  123. require.NoError(t, err)
  124. assert.Len(t, modelList.Models, 1)
  125. assert.Equal(t, "test-model:latest", modelList.Models[0].Name)
  126. },
  127. },
  128. {
  129. Name: "openai list models with tags",
  130. Method: http.MethodGet,
  131. Path: "/v1/models",
  132. Expected: func(t *testing.T, resp *http.Response) {
  133. contentType := resp.Header.Get("Content-Type")
  134. assert.Equal(t, "application/json", contentType)
  135. body, err := io.ReadAll(resp.Body)
  136. require.NoError(t, err)
  137. var modelList openai.ListCompletion
  138. err = json.Unmarshal(body, &modelList)
  139. require.NoError(t, err)
  140. assert.Len(t, modelList.Data, 1)
  141. assert.Equal(t, "test-model:latest", modelList.Data[0].Id)
  142. assert.Equal(t, "library", modelList.Data[0].OwnedBy)
  143. },
  144. },
  145. {
  146. Name: "Create Model Handler",
  147. Method: http.MethodPost,
  148. Path: "/api/create",
  149. Setup: func(t *testing.T, req *http.Request) {
  150. fname := createTestFile(t, "ollama-model")
  151. stream := false
  152. createReq := api.CreateRequest{
  153. Name: "t-bone",
  154. Modelfile: fmt.Sprintf("FROM %s", fname),
  155. Stream: &stream,
  156. }
  157. jsonData, err := json.Marshal(createReq)
  158. require.NoError(t, err)
  159. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  160. },
  161. Expected: func(t *testing.T, resp *http.Response) {
  162. contentType := resp.Header.Get("Content-Type")
  163. assert.Equal(t, "application/json", contentType)
  164. _, err := io.ReadAll(resp.Body)
  165. require.NoError(t, err)
  166. assert.Equal(t, 200, resp.StatusCode)
  167. model, err := GetModel("t-bone")
  168. require.NoError(t, err)
  169. assert.Equal(t, "t-bone:latest", model.ShortName)
  170. },
  171. },
  172. {
  173. Name: "Copy Model Handler",
  174. Method: http.MethodPost,
  175. Path: "/api/copy",
  176. Setup: func(t *testing.T, req *http.Request) {
  177. createTestModel(t, "hamshank")
  178. copyReq := api.CopyRequest{
  179. Source: "hamshank",
  180. Destination: "beefsteak",
  181. }
  182. jsonData, err := json.Marshal(copyReq)
  183. require.NoError(t, err)
  184. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  185. },
  186. Expected: func(t *testing.T, resp *http.Response) {
  187. model, err := GetModel("beefsteak")
  188. require.NoError(t, err)
  189. assert.Equal(t, "beefsteak:latest", model.ShortName)
  190. },
  191. },
  192. {
  193. Name: "Show Model Handler",
  194. Method: http.MethodPost,
  195. Path: "/api/show",
  196. Setup: func(t *testing.T, req *http.Request) {
  197. createTestModel(t, "show-model")
  198. showReq := api.ShowRequest{Model: "show-model"}
  199. jsonData, err := json.Marshal(showReq)
  200. require.NoError(t, err)
  201. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  202. },
  203. Expected: func(t *testing.T, resp *http.Response) {
  204. contentType := resp.Header.Get("Content-Type")
  205. assert.Equal(t, "application/json; charset=utf-8", contentType)
  206. body, err := io.ReadAll(resp.Body)
  207. require.NoError(t, err)
  208. var showResp api.ShowResponse
  209. err = json.Unmarshal(body, &showResp)
  210. require.NoError(t, err)
  211. var params []string
  212. paramsSplit := strings.Split(showResp.Parameters, "\n")
  213. for _, p := range paramsSplit {
  214. params = append(params, strings.Join(strings.Fields(p), " "))
  215. }
  216. sort.Strings(params)
  217. expectedParams := []string{
  218. "seed 42",
  219. "stop \"bar\"",
  220. "stop \"foo\"",
  221. "top_p 0.9",
  222. }
  223. assert.Equal(t, expectedParams, params)
  224. assert.InDelta(t, 0, showResp.ModelInfo["general.parameter_count"], 1e-9, "Parameter count should be 0")
  225. },
  226. },
  227. {
  228. Name: "openai retrieve model handler",
  229. Method: http.MethodGet,
  230. Path: "/v1/models/show-model",
  231. Expected: func(t *testing.T, resp *http.Response) {
  232. contentType := resp.Header.Get("Content-Type")
  233. assert.Equal(t, "application/json", contentType)
  234. body, err := io.ReadAll(resp.Body)
  235. require.NoError(t, err)
  236. var retrieveResp api.RetrieveModelResponse
  237. err = json.Unmarshal(body, &retrieveResp)
  238. require.NoError(t, err)
  239. assert.Equal(t, "show-model", retrieveResp.Id)
  240. assert.Equal(t, "library", retrieveResp.OwnedBy)
  241. },
  242. },
  243. {
  244. Name: "Embed Handler Empty Input",
  245. Method: http.MethodPost,
  246. Path: "/api/embed",
  247. Setup: func(t *testing.T, req *http.Request) {
  248. embedReq := api.EmbedRequest{
  249. Model: "t-bone",
  250. Input: "",
  251. }
  252. jsonData, err := json.Marshal(embedReq)
  253. require.NoError(t, err)
  254. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  255. },
  256. Expected: func(t *testing.T, resp *http.Response) {
  257. contentType := resp.Header.Get("Content-Type")
  258. assert.Equal(t, "application/json; charset=utf-8", contentType)
  259. body, err := io.ReadAll(resp.Body)
  260. require.NoError(t, err)
  261. var embedResp api.EmbedResponse
  262. err = json.Unmarshal(body, &embedResp)
  263. require.NoError(t, err)
  264. assert.Equal(t, "t-bone", embedResp.Model)
  265. assert.Nil(t, embedResp.Embeddings)
  266. },
  267. },
  268. {
  269. Name: "Embed Handler Invalid Input",
  270. Method: http.MethodPost,
  271. Path: "/api/embed",
  272. Setup: func(t *testing.T, req *http.Request) {
  273. embedReq := api.EmbedRequest{
  274. Model: "t-bone",
  275. Input: 2,
  276. }
  277. jsonData, err := json.Marshal(embedReq)
  278. require.NoError(t, err)
  279. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  280. },
  281. Expected: func(t *testing.T, resp *http.Response) {
  282. contentType := resp.Header.Get("Content-Type")
  283. assert.Equal(t, "application/json; charset=utf-8", contentType)
  284. _, err := io.ReadAll(resp.Body)
  285. require.NoError(t, err)
  286. assert.Equal(t, 400, resp.StatusCode)
  287. },
  288. },
  289. }
  290. t.Setenv("OLLAMA_MODELS", t.TempDir())
  291. envconfig.LoadConfig()
  292. s := &Server{}
  293. router := s.GenerateRoutes()
  294. httpSrv := httptest.NewServer(router)
  295. t.Cleanup(httpSrv.Close)
  296. for _, tc := range testCases {
  297. t.Run(tc.Name, func(t *testing.T) {
  298. u := httpSrv.URL + tc.Path
  299. req, err := http.NewRequestWithContext(context.TODO(), tc.Method, u, nil)
  300. require.NoError(t, err)
  301. if tc.Setup != nil {
  302. tc.Setup(t, req)
  303. }
  304. resp, err := httpSrv.Client().Do(req)
  305. require.NoError(t, err)
  306. defer resp.Body.Close()
  307. if tc.Expected != nil {
  308. tc.Expected(t, resp)
  309. }
  310. })
  311. }
  312. }
  313. func TestCase(t *testing.T) {
  314. t.Setenv("OLLAMA_MODELS", t.TempDir())
  315. envconfig.LoadConfig()
  316. cases := []string{
  317. "mistral",
  318. "llama3:latest",
  319. "library/phi3:q4_0",
  320. "registry.ollama.ai/library/gemma:q5_K_M",
  321. // TODO: host:port currently fails on windows (#4107)
  322. // "localhost:5000/alice/bob:latest",
  323. }
  324. var s Server
  325. for _, tt := range cases {
  326. t.Run(tt, func(t *testing.T) {
  327. w := createRequest(t, s.CreateModelHandler, api.CreateRequest{
  328. Name: tt,
  329. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  330. Stream: &stream,
  331. })
  332. if w.Code != http.StatusOK {
  333. t.Fatalf("expected status 200 got %d", w.Code)
  334. }
  335. expect, err := json.Marshal(map[string]string{"error": "a model with that name already exists"})
  336. if err != nil {
  337. t.Fatal(err)
  338. }
  339. t.Run("create", func(t *testing.T) {
  340. w = createRequest(t, s.CreateModelHandler, api.CreateRequest{
  341. Name: strings.ToUpper(tt),
  342. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  343. Stream: &stream,
  344. })
  345. if w.Code != http.StatusBadRequest {
  346. t.Fatalf("expected status 500 got %d", w.Code)
  347. }
  348. if !bytes.Equal(w.Body.Bytes(), expect) {
  349. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  350. }
  351. })
  352. t.Run("pull", func(t *testing.T) {
  353. w := createRequest(t, s.PullModelHandler, api.PullRequest{
  354. Name: strings.ToUpper(tt),
  355. Stream: &stream,
  356. })
  357. if w.Code != http.StatusBadRequest {
  358. t.Fatalf("expected status 500 got %d", w.Code)
  359. }
  360. if !bytes.Equal(w.Body.Bytes(), expect) {
  361. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  362. }
  363. })
  364. t.Run("copy", func(t *testing.T) {
  365. w := createRequest(t, s.CopyModelHandler, api.CopyRequest{
  366. Source: tt,
  367. Destination: strings.ToUpper(tt),
  368. })
  369. if w.Code != http.StatusBadRequest {
  370. t.Fatalf("expected status 500 got %d", w.Code)
  371. }
  372. if !bytes.Equal(w.Body.Bytes(), expect) {
  373. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  374. }
  375. })
  376. })
  377. }
  378. }
  379. func TestShow(t *testing.T) {
  380. t.Setenv("OLLAMA_MODELS", t.TempDir())
  381. envconfig.LoadConfig()
  382. var s Server
  383. createRequest(t, s.CreateModelHandler, api.CreateRequest{
  384. Name: "show-model",
  385. Modelfile: fmt.Sprintf(
  386. "FROM %s\nFROM %s",
  387. createBinFile(t, llm.KV{"general.architecture": "test"}, nil),
  388. createBinFile(t, llm.KV{"general.architecture": "clip"}, nil),
  389. ),
  390. })
  391. w := createRequest(t, s.ShowModelHandler, api.ShowRequest{
  392. Name: "show-model",
  393. })
  394. if w.Code != http.StatusOK {
  395. t.Fatalf("expected status code 200, actual %d", w.Code)
  396. }
  397. var resp api.ShowResponse
  398. if err := json.NewDecoder(w.Body).Decode(&resp); err != nil {
  399. t.Fatal(err)
  400. }
  401. if resp.ModelInfo["general.architecture"] != "test" {
  402. t.Fatal("Expected model architecture to be 'test', but got", resp.ModelInfo["general.architecture"])
  403. }
  404. if resp.ProjectorInfo["general.architecture"] != "clip" {
  405. t.Fatal("Expected projector architecture to be 'clip', but got", resp.ProjectorInfo["general.architecture"])
  406. }
  407. }
  408. func TestNormalize(t *testing.T) {
  409. type testCase struct {
  410. input []float32
  411. }
  412. testCases := []testCase{
  413. {input: []float32{1}},
  414. {input: []float32{0, 1, 2, 3}},
  415. {input: []float32{0.1, 0.2, 0.3}},
  416. {input: []float32{-0.1, 0.2, 0.3, -0.4}},
  417. {input: []float32{0, 0, 0}},
  418. }
  419. isNormalized := func(vec []float32) (res bool) {
  420. sum := 0.0
  421. for _, v := range vec {
  422. sum += float64(v * v)
  423. }
  424. if math.Abs(sum-1) > 1e-6 {
  425. return sum == 0
  426. } else {
  427. return true
  428. }
  429. }
  430. for _, tc := range testCases {
  431. t.Run("", func(t *testing.T) {
  432. normalized := normalize(tc.input)
  433. if !isNormalized(normalized) {
  434. t.Errorf("Vector %v is not normalized", tc.input)
  435. }
  436. })
  437. }
  438. }