routes_test.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525
  1. package server
  2. import (
  3. "bytes"
  4. "context"
  5. "encoding/binary"
  6. "encoding/json"
  7. "fmt"
  8. "io"
  9. "math"
  10. "net/http"
  11. "net/http/httptest"
  12. "os"
  13. "sort"
  14. "strings"
  15. "testing"
  16. "github.com/stretchr/testify/assert"
  17. "github.com/stretchr/testify/require"
  18. "github.com/ollama/ollama/api"
  19. "github.com/ollama/ollama/envconfig"
  20. "github.com/ollama/ollama/llm"
  21. "github.com/ollama/ollama/openai"
  22. "github.com/ollama/ollama/parser"
  23. "github.com/ollama/ollama/types/model"
  24. "github.com/ollama/ollama/version"
  25. )
  26. func createTestFile(t *testing.T, name string) string {
  27. t.Helper()
  28. f, err := os.CreateTemp(t.TempDir(), name)
  29. require.NoError(t, err)
  30. defer f.Close()
  31. err = binary.Write(f, binary.LittleEndian, []byte("GGUF"))
  32. require.NoError(t, err)
  33. err = binary.Write(f, binary.LittleEndian, uint32(3))
  34. require.NoError(t, err)
  35. err = binary.Write(f, binary.LittleEndian, uint64(0))
  36. require.NoError(t, err)
  37. err = binary.Write(f, binary.LittleEndian, uint64(0))
  38. require.NoError(t, err)
  39. return f.Name()
  40. }
  41. func Test_Routes(t *testing.T) {
  42. type testCase struct {
  43. Name string
  44. Method string
  45. Path string
  46. Setup func(t *testing.T, req *http.Request)
  47. Expected func(t *testing.T, resp *http.Response)
  48. }
  49. createTestModel := func(t *testing.T, name string) {
  50. t.Helper()
  51. fname := createTestFile(t, "ollama-model")
  52. r := strings.NewReader(fmt.Sprintf("FROM %s\nPARAMETER seed 42\nPARAMETER top_p 0.9\nPARAMETER stop foo\nPARAMETER stop bar", fname))
  53. modelfile, err := parser.ParseFile(r)
  54. require.NoError(t, err)
  55. fn := func(resp api.ProgressResponse) {
  56. t.Logf("Status: %s", resp.Status)
  57. }
  58. err = CreateModel(context.TODO(), model.ParseName(name), "", "", modelfile, fn)
  59. require.NoError(t, err)
  60. }
  61. testCases := []testCase{
  62. {
  63. Name: "Version Handler",
  64. Method: http.MethodGet,
  65. Path: "/api/version",
  66. Setup: func(t *testing.T, req *http.Request) {
  67. },
  68. Expected: func(t *testing.T, resp *http.Response) {
  69. contentType := resp.Header.Get("Content-Type")
  70. assert.Equal(t, "application/json; charset=utf-8", contentType)
  71. body, err := io.ReadAll(resp.Body)
  72. require.NoError(t, err)
  73. assert.Equal(t, fmt.Sprintf(`{"version":"%s"}`, version.Version), string(body))
  74. },
  75. },
  76. {
  77. Name: "Tags Handler (no tags)",
  78. Method: http.MethodGet,
  79. Path: "/api/tags",
  80. Expected: func(t *testing.T, resp *http.Response) {
  81. contentType := resp.Header.Get("Content-Type")
  82. assert.Equal(t, "application/json; charset=utf-8", contentType)
  83. body, err := io.ReadAll(resp.Body)
  84. require.NoError(t, err)
  85. var modelList api.ListResponse
  86. err = json.Unmarshal(body, &modelList)
  87. require.NoError(t, err)
  88. assert.NotNil(t, modelList.Models)
  89. assert.Empty(t, len(modelList.Models))
  90. },
  91. },
  92. {
  93. Name: "openai empty list",
  94. Method: http.MethodGet,
  95. Path: "/v1/models",
  96. Expected: func(t *testing.T, resp *http.Response) {
  97. contentType := resp.Header.Get("Content-Type")
  98. assert.Equal(t, "application/json", contentType)
  99. body, err := io.ReadAll(resp.Body)
  100. require.NoError(t, err)
  101. var modelList openai.ListCompletion
  102. err = json.Unmarshal(body, &modelList)
  103. require.NoError(t, err)
  104. assert.Equal(t, "list", modelList.Object)
  105. assert.Empty(t, modelList.Data)
  106. },
  107. },
  108. {
  109. Name: "Tags Handler (yes tags)",
  110. Method: http.MethodGet,
  111. Path: "/api/tags",
  112. Setup: func(t *testing.T, req *http.Request) {
  113. createTestModel(t, "test-model")
  114. },
  115. Expected: func(t *testing.T, resp *http.Response) {
  116. contentType := resp.Header.Get("Content-Type")
  117. assert.Equal(t, "application/json; charset=utf-8", contentType)
  118. body, err := io.ReadAll(resp.Body)
  119. require.NoError(t, err)
  120. assert.NotContains(t, string(body), "expires_at")
  121. var modelList api.ListResponse
  122. err = json.Unmarshal(body, &modelList)
  123. require.NoError(t, err)
  124. assert.Len(t, modelList.Models, 1)
  125. assert.Equal(t, "test-model:latest", modelList.Models[0].Name)
  126. },
  127. },
  128. {
  129. Name: "openai list models with tags",
  130. Method: http.MethodGet,
  131. Path: "/v1/models",
  132. Expected: func(t *testing.T, resp *http.Response) {
  133. contentType := resp.Header.Get("Content-Type")
  134. assert.Equal(t, "application/json", contentType)
  135. body, err := io.ReadAll(resp.Body)
  136. require.NoError(t, err)
  137. var modelList openai.ListCompletion
  138. err = json.Unmarshal(body, &modelList)
  139. require.NoError(t, err)
  140. assert.Len(t, modelList.Data, 1)
  141. assert.Equal(t, "test-model:latest", modelList.Data[0].Id)
  142. assert.Equal(t, "library", modelList.Data[0].OwnedBy)
  143. },
  144. },
  145. {
  146. Name: "Create Model Handler",
  147. Method: http.MethodPost,
  148. Path: "/api/create",
  149. Setup: func(t *testing.T, req *http.Request) {
  150. fname := createTestFile(t, "ollama-model")
  151. stream := false
  152. createReq := api.CreateRequest{
  153. Name: "t-bone",
  154. Modelfile: fmt.Sprintf("FROM %s", fname),
  155. Stream: &stream,
  156. }
  157. jsonData, err := json.Marshal(createReq)
  158. require.NoError(t, err)
  159. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  160. },
  161. Expected: func(t *testing.T, resp *http.Response) {
  162. contentType := resp.Header.Get("Content-Type")
  163. assert.Equal(t, "application/json", contentType)
  164. _, err := io.ReadAll(resp.Body)
  165. require.NoError(t, err)
  166. assert.Equal(t, 200, resp.StatusCode)
  167. model, err := GetModel("t-bone")
  168. require.NoError(t, err)
  169. assert.Equal(t, "t-bone:latest", model.ShortName)
  170. },
  171. },
  172. {
  173. Name: "Copy Model Handler",
  174. Method: http.MethodPost,
  175. Path: "/api/copy",
  176. Setup: func(t *testing.T, req *http.Request) {
  177. createTestModel(t, "hamshank")
  178. copyReq := api.CopyRequest{
  179. Source: "hamshank",
  180. Destination: "beefsteak",
  181. }
  182. jsonData, err := json.Marshal(copyReq)
  183. require.NoError(t, err)
  184. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  185. },
  186. Expected: func(t *testing.T, resp *http.Response) {
  187. model, err := GetModel("beefsteak")
  188. require.NoError(t, err)
  189. assert.Equal(t, "beefsteak:latest", model.ShortName)
  190. },
  191. },
  192. {
  193. Name: "Show Model Handler",
  194. Method: http.MethodPost,
  195. Path: "/api/show",
  196. Setup: func(t *testing.T, req *http.Request) {
  197. createTestModel(t, "show-model")
  198. showReq := api.ShowRequest{Model: "show-model"}
  199. jsonData, err := json.Marshal(showReq)
  200. require.NoError(t, err)
  201. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  202. },
  203. Expected: func(t *testing.T, resp *http.Response) {
  204. contentType := resp.Header.Get("Content-Type")
  205. assert.Equal(t, "application/json; charset=utf-8", contentType)
  206. body, err := io.ReadAll(resp.Body)
  207. require.NoError(t, err)
  208. var showResp api.ShowResponse
  209. err = json.Unmarshal(body, &showResp)
  210. require.NoError(t, err)
  211. var params []string
  212. paramsSplit := strings.Split(showResp.Parameters, "\n")
  213. for _, p := range paramsSplit {
  214. params = append(params, strings.Join(strings.Fields(p), " "))
  215. }
  216. sort.Strings(params)
  217. expectedParams := []string{
  218. "seed 42",
  219. "stop \"bar\"",
  220. "stop \"foo\"",
  221. "top_p 0.9",
  222. }
  223. assert.Equal(t, expectedParams, params)
  224. assert.InDelta(t, 0, showResp.ModelInfo["general.parameter_count"], 1e-9, "Parameter count should be 0")
  225. },
  226. },
  227. {
  228. Name: "openai retrieve model handler",
  229. Method: http.MethodGet,
  230. Path: "/v1/models/show-model",
  231. Expected: func(t *testing.T, resp *http.Response) {
  232. contentType := resp.Header.Get("Content-Type")
  233. assert.Equal(t, "application/json", contentType)
  234. body, err := io.ReadAll(resp.Body)
  235. require.NoError(t, err)
  236. var retrieveResp api.RetrieveModelResponse
  237. err = json.Unmarshal(body, &retrieveResp)
  238. require.NoError(t, err)
  239. assert.Equal(t, "show-model", retrieveResp.Id)
  240. assert.Equal(t, "library", retrieveResp.OwnedBy)
  241. },
  242. },
  243. {
  244. Name: "Embed Handler Empty Input",
  245. Method: http.MethodPost,
  246. Path: "/api/embed",
  247. Setup: func(t *testing.T, req *http.Request) {
  248. embedReq := api.EmbedRequest{
  249. Model: "t-bone",
  250. Input: "",
  251. }
  252. jsonData, err := json.Marshal(embedReq)
  253. require.NoError(t, err)
  254. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  255. },
  256. Expected: func(t *testing.T, resp *http.Response) {
  257. contentType := resp.Header.Get("Content-Type")
  258. if contentType != "application/json; charset=utf-8" {
  259. t.Fatalf("expected content type application/json; charset=utf-8, got %s", contentType)
  260. }
  261. body, err := io.ReadAll(resp.Body)
  262. if err != nil {
  263. t.Fatal(err)
  264. }
  265. var embedResp api.EmbedResponse
  266. err = json.Unmarshal(body, &embedResp)
  267. if err != nil {
  268. t.Fatal(err)
  269. }
  270. if embedResp.Model != "t-bone" {
  271. t.Fatalf("expected model t-bone, got %s", embedResp.Model)
  272. }
  273. if embedResp.Embeddings != nil {
  274. t.Fatalf("expected embeddings to be nil, got %v", embedResp.Embeddings)
  275. }
  276. },
  277. },
  278. {
  279. Name: "Embed Handler Invalid Input",
  280. Method: http.MethodPost,
  281. Path: "/api/embed",
  282. Setup: func(t *testing.T, req *http.Request) {
  283. embedReq := api.EmbedRequest{
  284. Model: "t-bone",
  285. Input: 2,
  286. }
  287. jsonData, err := json.Marshal(embedReq)
  288. require.NoError(t, err)
  289. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  290. },
  291. Expected: func(t *testing.T, resp *http.Response) {
  292. contentType := resp.Header.Get("Content-Type")
  293. if contentType != "application/json; charset=utf-8" {
  294. t.Fatalf("expected content type application/json; charset=utf-8, got %s", contentType)
  295. }
  296. _, err := io.ReadAll(resp.Body)
  297. if err != nil {
  298. t.Fatal(err)
  299. }
  300. if resp.StatusCode != http.StatusBadRequest {
  301. t.Fatalf("expected status code 400, got %d", resp.StatusCode)
  302. }
  303. },
  304. },
  305. }
  306. t.Setenv("OLLAMA_MODELS", t.TempDir())
  307. envconfig.LoadConfig()
  308. s := &Server{}
  309. router := s.GenerateRoutes()
  310. httpSrv := httptest.NewServer(router)
  311. t.Cleanup(httpSrv.Close)
  312. for _, tc := range testCases {
  313. t.Run(tc.Name, func(t *testing.T) {
  314. u := httpSrv.URL + tc.Path
  315. req, err := http.NewRequestWithContext(context.TODO(), tc.Method, u, nil)
  316. require.NoError(t, err)
  317. if tc.Setup != nil {
  318. tc.Setup(t, req)
  319. }
  320. resp, err := httpSrv.Client().Do(req)
  321. require.NoError(t, err)
  322. defer resp.Body.Close()
  323. if tc.Expected != nil {
  324. tc.Expected(t, resp)
  325. }
  326. })
  327. }
  328. }
  329. func TestCase(t *testing.T) {
  330. t.Setenv("OLLAMA_MODELS", t.TempDir())
  331. envconfig.LoadConfig()
  332. cases := []string{
  333. "mistral",
  334. "llama3:latest",
  335. "library/phi3:q4_0",
  336. "registry.ollama.ai/library/gemma:q5_K_M",
  337. // TODO: host:port currently fails on windows (#4107)
  338. // "localhost:5000/alice/bob:latest",
  339. }
  340. var s Server
  341. for _, tt := range cases {
  342. t.Run(tt, func(t *testing.T) {
  343. w := createRequest(t, s.CreateModelHandler, api.CreateRequest{
  344. Name: tt,
  345. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  346. Stream: &stream,
  347. })
  348. if w.Code != http.StatusOK {
  349. t.Fatalf("expected status 200 got %d", w.Code)
  350. }
  351. expect, err := json.Marshal(map[string]string{"error": "a model with that name already exists"})
  352. if err != nil {
  353. t.Fatal(err)
  354. }
  355. t.Run("create", func(t *testing.T) {
  356. w = createRequest(t, s.CreateModelHandler, api.CreateRequest{
  357. Name: strings.ToUpper(tt),
  358. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  359. Stream: &stream,
  360. })
  361. if w.Code != http.StatusBadRequest {
  362. t.Fatalf("expected status 500 got %d", w.Code)
  363. }
  364. if !bytes.Equal(w.Body.Bytes(), expect) {
  365. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  366. }
  367. })
  368. t.Run("pull", func(t *testing.T) {
  369. w := createRequest(t, s.PullModelHandler, api.PullRequest{
  370. Name: strings.ToUpper(tt),
  371. Stream: &stream,
  372. })
  373. if w.Code != http.StatusBadRequest {
  374. t.Fatalf("expected status 500 got %d", w.Code)
  375. }
  376. if !bytes.Equal(w.Body.Bytes(), expect) {
  377. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  378. }
  379. })
  380. t.Run("copy", func(t *testing.T) {
  381. w := createRequest(t, s.CopyModelHandler, api.CopyRequest{
  382. Source: tt,
  383. Destination: strings.ToUpper(tt),
  384. })
  385. if w.Code != http.StatusBadRequest {
  386. t.Fatalf("expected status 500 got %d", w.Code)
  387. }
  388. if !bytes.Equal(w.Body.Bytes(), expect) {
  389. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  390. }
  391. })
  392. })
  393. }
  394. }
  395. func TestShow(t *testing.T) {
  396. t.Setenv("OLLAMA_MODELS", t.TempDir())
  397. envconfig.LoadConfig()
  398. var s Server
  399. createRequest(t, s.CreateModelHandler, api.CreateRequest{
  400. Name: "show-model",
  401. Modelfile: fmt.Sprintf(
  402. "FROM %s\nFROM %s",
  403. createBinFile(t, llm.KV{"general.architecture": "test"}, nil),
  404. createBinFile(t, llm.KV{"general.architecture": "clip"}, nil),
  405. ),
  406. })
  407. w := createRequest(t, s.ShowModelHandler, api.ShowRequest{
  408. Name: "show-model",
  409. })
  410. if w.Code != http.StatusOK {
  411. t.Fatalf("expected status code 200, actual %d", w.Code)
  412. }
  413. var resp api.ShowResponse
  414. if err := json.NewDecoder(w.Body).Decode(&resp); err != nil {
  415. t.Fatal(err)
  416. }
  417. if resp.ModelInfo["general.architecture"] != "test" {
  418. t.Fatal("Expected model architecture to be 'test', but got", resp.ModelInfo["general.architecture"])
  419. }
  420. if resp.ProjectorInfo["general.architecture"] != "clip" {
  421. t.Fatal("Expected projector architecture to be 'clip', but got", resp.ProjectorInfo["general.architecture"])
  422. }
  423. }
  424. func TestNormalize(t *testing.T) {
  425. type testCase struct {
  426. input []float32
  427. }
  428. testCases := []testCase{
  429. {input: []float32{1}},
  430. {input: []float32{0, 1, 2, 3}},
  431. {input: []float32{0.1, 0.2, 0.3}},
  432. {input: []float32{-0.1, 0.2, 0.3, -0.4}},
  433. {input: []float32{0, 0, 0}},
  434. }
  435. isNormalized := func(vec []float32) (res bool) {
  436. sum := 0.0
  437. for _, v := range vec {
  438. sum += float64(v * v)
  439. }
  440. if math.Abs(sum-1) > 1e-6 {
  441. return sum == 0
  442. } else {
  443. return true
  444. }
  445. }
  446. for _, tc := range testCases {
  447. t.Run("", func(t *testing.T) {
  448. normalized := normalize(tc.input)
  449. if !isNormalized(normalized) {
  450. t.Errorf("Vector %v is not normalized", tc.input)
  451. }
  452. })
  453. }
  454. }