routes_test.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540
  1. package server
  2. import (
  3. "bytes"
  4. "context"
  5. "encoding/binary"
  6. "encoding/json"
  7. "errors"
  8. "fmt"
  9. "io"
  10. "math"
  11. "net"
  12. "net/http"
  13. "net/http/httptest"
  14. "os"
  15. "path/filepath"
  16. "sort"
  17. "strings"
  18. "testing"
  19. "time"
  20. "github.com/gin-gonic/gin"
  21. "github.com/stretchr/testify/assert"
  22. "github.com/stretchr/testify/require"
  23. "github.com/ollama/ollama/api"
  24. "github.com/ollama/ollama/llm"
  25. "github.com/ollama/ollama/openai"
  26. "github.com/ollama/ollama/parser"
  27. "github.com/ollama/ollama/types/model"
  28. "github.com/ollama/ollama/version"
  29. )
  30. func createTestFile(t *testing.T, name string) string {
  31. t.Helper()
  32. f, err := os.CreateTemp(t.TempDir(), name)
  33. require.NoError(t, err)
  34. defer f.Close()
  35. err = binary.Write(f, binary.LittleEndian, []byte("GGUF"))
  36. require.NoError(t, err)
  37. err = binary.Write(f, binary.LittleEndian, uint32(3))
  38. require.NoError(t, err)
  39. err = binary.Write(f, binary.LittleEndian, uint64(0))
  40. require.NoError(t, err)
  41. err = binary.Write(f, binary.LittleEndian, uint64(0))
  42. require.NoError(t, err)
  43. return f.Name()
  44. }
  45. func Test_Routes(t *testing.T) {
  46. type testCase struct {
  47. Name string
  48. Method string
  49. Path string
  50. Setup func(t *testing.T, req *http.Request)
  51. Expected func(t *testing.T, resp *http.Response)
  52. }
  53. createTestModel := func(t *testing.T, name string) {
  54. t.Helper()
  55. fname := createTestFile(t, "ollama-model")
  56. r := strings.NewReader(fmt.Sprintf("FROM %s\nPARAMETER seed 42\nPARAMETER top_p 0.9\nPARAMETER stop foo\nPARAMETER stop bar", fname))
  57. modelfile, err := parser.ParseFile(r)
  58. require.NoError(t, err)
  59. fn := func(resp api.ProgressResponse) {
  60. t.Logf("Status: %s", resp.Status)
  61. }
  62. err = CreateModel(context.TODO(), model.ParseName(name), "", "", modelfile, fn)
  63. require.NoError(t, err)
  64. }
  65. testCases := []testCase{
  66. {
  67. Name: "Version Handler",
  68. Method: http.MethodGet,
  69. Path: "/api/version",
  70. Setup: func(t *testing.T, req *http.Request) {
  71. },
  72. Expected: func(t *testing.T, resp *http.Response) {
  73. contentType := resp.Header.Get("Content-Type")
  74. assert.Equal(t, "application/json; charset=utf-8", contentType)
  75. body, err := io.ReadAll(resp.Body)
  76. require.NoError(t, err)
  77. assert.Equal(t, fmt.Sprintf(`{"version":"%s"}`, version.Version), string(body))
  78. },
  79. },
  80. {
  81. Name: "Tags Handler (no tags)",
  82. Method: http.MethodGet,
  83. Path: "/api/tags",
  84. Expected: func(t *testing.T, resp *http.Response) {
  85. contentType := resp.Header.Get("Content-Type")
  86. assert.Equal(t, "application/json; charset=utf-8", contentType)
  87. body, err := io.ReadAll(resp.Body)
  88. require.NoError(t, err)
  89. var modelList api.ListResponse
  90. err = json.Unmarshal(body, &modelList)
  91. require.NoError(t, err)
  92. assert.NotNil(t, modelList.Models)
  93. assert.Empty(t, len(modelList.Models))
  94. },
  95. },
  96. {
  97. Name: "openai empty list",
  98. Method: http.MethodGet,
  99. Path: "/v1/models",
  100. Expected: func(t *testing.T, resp *http.Response) {
  101. contentType := resp.Header.Get("Content-Type")
  102. assert.Equal(t, "application/json", contentType)
  103. body, err := io.ReadAll(resp.Body)
  104. require.NoError(t, err)
  105. var modelList openai.ListCompletion
  106. err = json.Unmarshal(body, &modelList)
  107. require.NoError(t, err)
  108. assert.Equal(t, "list", modelList.Object)
  109. assert.Empty(t, modelList.Data)
  110. },
  111. },
  112. {
  113. Name: "Tags Handler (yes tags)",
  114. Method: http.MethodGet,
  115. Path: "/api/tags",
  116. Setup: func(t *testing.T, req *http.Request) {
  117. createTestModel(t, "test-model")
  118. },
  119. Expected: func(t *testing.T, resp *http.Response) {
  120. contentType := resp.Header.Get("Content-Type")
  121. assert.Equal(t, "application/json; charset=utf-8", contentType)
  122. body, err := io.ReadAll(resp.Body)
  123. require.NoError(t, err)
  124. assert.NotContains(t, string(body), "expires_at")
  125. var modelList api.ListResponse
  126. err = json.Unmarshal(body, &modelList)
  127. require.NoError(t, err)
  128. assert.Len(t, modelList.Models, 1)
  129. assert.Equal(t, "test-model:latest", modelList.Models[0].Name)
  130. },
  131. },
  132. {
  133. Name: "openai list models with tags",
  134. Method: http.MethodGet,
  135. Path: "/v1/models",
  136. Expected: func(t *testing.T, resp *http.Response) {
  137. contentType := resp.Header.Get("Content-Type")
  138. assert.Equal(t, "application/json", contentType)
  139. body, err := io.ReadAll(resp.Body)
  140. require.NoError(t, err)
  141. var modelList openai.ListCompletion
  142. err = json.Unmarshal(body, &modelList)
  143. require.NoError(t, err)
  144. assert.Len(t, modelList.Data, 1)
  145. assert.Equal(t, "test-model:latest", modelList.Data[0].Id)
  146. assert.Equal(t, "library", modelList.Data[0].OwnedBy)
  147. },
  148. },
  149. {
  150. Name: "Create Model Handler",
  151. Method: http.MethodPost,
  152. Path: "/api/create",
  153. Setup: func(t *testing.T, req *http.Request) {
  154. fname := createTestFile(t, "ollama-model")
  155. stream := false
  156. createReq := api.CreateRequest{
  157. Name: "t-bone",
  158. Modelfile: fmt.Sprintf("FROM %s", fname),
  159. Stream: &stream,
  160. }
  161. jsonData, err := json.Marshal(createReq)
  162. require.NoError(t, err)
  163. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  164. },
  165. Expected: func(t *testing.T, resp *http.Response) {
  166. contentType := resp.Header.Get("Content-Type")
  167. assert.Equal(t, "application/json", contentType)
  168. _, err := io.ReadAll(resp.Body)
  169. require.NoError(t, err)
  170. assert.Equal(t, 200, resp.StatusCode)
  171. model, err := GetModel("t-bone")
  172. require.NoError(t, err)
  173. assert.Equal(t, "t-bone:latest", model.ShortName)
  174. },
  175. },
  176. {
  177. Name: "Copy Model Handler",
  178. Method: http.MethodPost,
  179. Path: "/api/copy",
  180. Setup: func(t *testing.T, req *http.Request) {
  181. createTestModel(t, "hamshank")
  182. copyReq := api.CopyRequest{
  183. Source: "hamshank",
  184. Destination: "beefsteak",
  185. }
  186. jsonData, err := json.Marshal(copyReq)
  187. require.NoError(t, err)
  188. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  189. },
  190. Expected: func(t *testing.T, resp *http.Response) {
  191. model, err := GetModel("beefsteak")
  192. require.NoError(t, err)
  193. assert.Equal(t, "beefsteak:latest", model.ShortName)
  194. },
  195. },
  196. {
  197. Name: "Show Model Handler",
  198. Method: http.MethodPost,
  199. Path: "/api/show",
  200. Setup: func(t *testing.T, req *http.Request) {
  201. createTestModel(t, "show-model")
  202. showReq := api.ShowRequest{Model: "show-model"}
  203. jsonData, err := json.Marshal(showReq)
  204. require.NoError(t, err)
  205. req.Body = io.NopCloser(bytes.NewReader(jsonData))
  206. },
  207. Expected: func(t *testing.T, resp *http.Response) {
  208. contentType := resp.Header.Get("Content-Type")
  209. assert.Equal(t, "application/json; charset=utf-8", contentType)
  210. body, err := io.ReadAll(resp.Body)
  211. require.NoError(t, err)
  212. var showResp api.ShowResponse
  213. err = json.Unmarshal(body, &showResp)
  214. require.NoError(t, err)
  215. var params []string
  216. paramsSplit := strings.Split(showResp.Parameters, "\n")
  217. for _, p := range paramsSplit {
  218. params = append(params, strings.Join(strings.Fields(p), " "))
  219. }
  220. sort.Strings(params)
  221. expectedParams := []string{
  222. "seed 42",
  223. "stop \"bar\"",
  224. "stop \"foo\"",
  225. "top_p 0.9",
  226. }
  227. assert.Equal(t, expectedParams, params)
  228. assert.InDelta(t, 0, showResp.ModelInfo["general.parameter_count"], 1e-9, "Parameter count should be 0")
  229. },
  230. },
  231. {
  232. Name: "openai retrieve model handler",
  233. Method: http.MethodGet,
  234. Path: "/v1/models/show-model",
  235. Expected: func(t *testing.T, resp *http.Response) {
  236. contentType := resp.Header.Get("Content-Type")
  237. assert.Equal(t, "application/json", contentType)
  238. body, err := io.ReadAll(resp.Body)
  239. require.NoError(t, err)
  240. var retrieveResp api.RetrieveModelResponse
  241. err = json.Unmarshal(body, &retrieveResp)
  242. require.NoError(t, err)
  243. assert.Equal(t, "show-model", retrieveResp.Id)
  244. assert.Equal(t, "library", retrieveResp.OwnedBy)
  245. },
  246. },
  247. }
  248. t.Setenv("OLLAMA_MODELS", t.TempDir())
  249. s := &Server{}
  250. router := s.GenerateRoutes()
  251. httpSrv := httptest.NewServer(router)
  252. t.Cleanup(httpSrv.Close)
  253. for _, tc := range testCases {
  254. t.Run(tc.Name, func(t *testing.T) {
  255. u := httpSrv.URL + tc.Path
  256. req, err := http.NewRequestWithContext(context.TODO(), tc.Method, u, nil)
  257. require.NoError(t, err)
  258. if tc.Setup != nil {
  259. tc.Setup(t, req)
  260. }
  261. resp, err := httpSrv.Client().Do(req)
  262. require.NoError(t, err)
  263. defer resp.Body.Close()
  264. if tc.Expected != nil {
  265. tc.Expected(t, resp)
  266. }
  267. })
  268. }
  269. }
  270. func TestCase(t *testing.T) {
  271. t.Setenv("OLLAMA_MODELS", t.TempDir())
  272. cases := []string{
  273. "mistral",
  274. "llama3:latest",
  275. "library/phi3:q4_0",
  276. "registry.ollama.ai/library/gemma:q5_K_M",
  277. // TODO: host:port currently fails on windows (#4107)
  278. // "localhost:5000/alice/bob:latest",
  279. }
  280. var s Server
  281. for _, tt := range cases {
  282. t.Run(tt, func(t *testing.T) {
  283. w := createRequest(t, s.CreateHandler, api.CreateRequest{
  284. Name: tt,
  285. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  286. Stream: &stream,
  287. })
  288. if w.Code != http.StatusOK {
  289. t.Fatalf("expected status 200 got %d", w.Code)
  290. }
  291. expect, err := json.Marshal(map[string]string{"error": "a model with that name already exists"})
  292. if err != nil {
  293. t.Fatal(err)
  294. }
  295. t.Run("create", func(t *testing.T) {
  296. w = createRequest(t, s.CreateHandler, api.CreateRequest{
  297. Name: strings.ToUpper(tt),
  298. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  299. Stream: &stream,
  300. })
  301. if w.Code != http.StatusBadRequest {
  302. t.Fatalf("expected status 500 got %d", w.Code)
  303. }
  304. if !bytes.Equal(w.Body.Bytes(), expect) {
  305. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  306. }
  307. })
  308. t.Run("pull", func(t *testing.T) {
  309. w := createRequest(t, s.PullHandler, api.PullRequest{
  310. Name: strings.ToUpper(tt),
  311. Stream: &stream,
  312. })
  313. if w.Code != http.StatusBadRequest {
  314. t.Fatalf("expected status 500 got %d", w.Code)
  315. }
  316. if !bytes.Equal(w.Body.Bytes(), expect) {
  317. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  318. }
  319. })
  320. t.Run("copy", func(t *testing.T) {
  321. w := createRequest(t, s.CopyHandler, api.CopyRequest{
  322. Source: tt,
  323. Destination: strings.ToUpper(tt),
  324. })
  325. if w.Code != http.StatusBadRequest {
  326. t.Fatalf("expected status 500 got %d", w.Code)
  327. }
  328. if !bytes.Equal(w.Body.Bytes(), expect) {
  329. t.Fatalf("expected error %s got %s", expect, w.Body.String())
  330. }
  331. })
  332. })
  333. }
  334. }
  335. func TestShow(t *testing.T) {
  336. t.Setenv("OLLAMA_MODELS", t.TempDir())
  337. var s Server
  338. createRequest(t, s.CreateHandler, api.CreateRequest{
  339. Name: "show-model",
  340. Modelfile: fmt.Sprintf(
  341. "FROM %s\nFROM %s",
  342. createBinFile(t, llm.KV{"general.architecture": "test"}, nil),
  343. createBinFile(t, llm.KV{"general.architecture": "clip"}, nil),
  344. ),
  345. })
  346. w := createRequest(t, s.ShowHandler, api.ShowRequest{
  347. Name: "show-model",
  348. })
  349. if w.Code != http.StatusOK {
  350. t.Fatalf("expected status code 200, actual %d", w.Code)
  351. }
  352. var resp api.ShowResponse
  353. if err := json.NewDecoder(w.Body).Decode(&resp); err != nil {
  354. t.Fatal(err)
  355. }
  356. if resp.ModelInfo["general.architecture"] != "test" {
  357. t.Fatal("Expected model architecture to be 'test', but got", resp.ModelInfo["general.architecture"])
  358. }
  359. if resp.ProjectorInfo["general.architecture"] != "clip" {
  360. t.Fatal("Expected projector architecture to be 'clip', but got", resp.ProjectorInfo["general.architecture"])
  361. }
  362. }
  363. func TestNormalize(t *testing.T) {
  364. type testCase struct {
  365. input []float32
  366. }
  367. testCases := []testCase{
  368. {input: []float32{1}},
  369. {input: []float32{0, 1, 2, 3}},
  370. {input: []float32{0.1, 0.2, 0.3}},
  371. {input: []float32{-0.1, 0.2, 0.3, -0.4}},
  372. {input: []float32{0, 0, 0}},
  373. }
  374. isNormalized := func(vec []float32) (res bool) {
  375. sum := 0.0
  376. for _, v := range vec {
  377. sum += float64(v * v)
  378. }
  379. if math.Abs(sum-1) > 1e-6 {
  380. return sum == 0
  381. } else {
  382. return true
  383. }
  384. }
  385. for _, tc := range testCases {
  386. t.Run("", func(t *testing.T) {
  387. normalized := normalize(tc.input)
  388. if !isNormalized(normalized) {
  389. t.Errorf("Vector %v is not normalized", tc.input)
  390. }
  391. })
  392. }
  393. }
  394. func TestServe(t *testing.T) {
  395. gin.SetMode(gin.TestMode)
  396. p := t.TempDir()
  397. t.Setenv("OLLAMA_MODELS", p)
  398. var s Server
  399. // seed some models
  400. createRequest(t, s.CreateHandler, api.CreateRequest{
  401. Name: "test-model",
  402. Modelfile: fmt.Sprintf("FROM %s", createBinFile(t, nil, nil)),
  403. })
  404. createRequest(t, s.CreateHandler, api.CreateRequest{
  405. Name: "test-model-2",
  406. Modelfile: "FROM test-model\nSYSTEM You are a good robot.",
  407. })
  408. createRequest(t, s.CreateHandler, api.CreateRequest{
  409. Name: "test-model-3",
  410. Modelfile: "FROM test-model\nSYSTEM You are a bad robot.",
  411. })
  412. checkFileExists(t, filepath.Join(p, "blobs", "*"), []string{
  413. filepath.Join(p, "blobs", "sha256-1c515c46e60f849c6aeffa86e256508ac450464762a31ca08648e418f07c9819"),
  414. filepath.Join(p, "blobs", "sha256-461fd034bb72312965d46160399b1b882c6a2f8c7305237ed7dd65f848fba10c"),
  415. filepath.Join(p, "blobs", "sha256-66e9776a5bb7e5f6093681aa8ba01a7a6b6ae1dd697281f11fa714eaa948a6a4"),
  416. filepath.Join(p, "blobs", "sha256-a4e5e156ddec27e286f75328784d7106b60a4eb1d246e950a001a3f944fbda99"),
  417. filepath.Join(p, "blobs", "sha256-b3a5b5b438604c5103ba403a5455af94ea98494b5bbc177f4665716a37b99c1e"),
  418. filepath.Join(p, "blobs", "sha256-ca239d7bd8ea90e4a5d2e6bf88f8d74a47b14336e73eb4e18bed4dd325018116"),
  419. })
  420. ln, err := net.Listen("tcp", "127.0.0.1:0")
  421. if err != nil {
  422. t.Fatal(err)
  423. }
  424. defer ln.Close()
  425. //nolint:errcheck
  426. go Serve(ln)
  427. // wait for server to be healthy (GET / => 200)
  428. ctx, cancel := context.WithTimeout(context.TODO(), time.Second)
  429. defer cancel()
  430. if err := func() error {
  431. tick := time.NewTicker(20 * time.Millisecond)
  432. defer tick.Stop()
  433. for {
  434. select {
  435. case <-ctx.Done():
  436. return errors.New("server did not become healthy")
  437. case <-tick.C:
  438. r, err := http.Get(fmt.Sprintf("http://%s", ln.Addr()))
  439. if err != nil {
  440. continue
  441. }
  442. if err := r.Body.Close(); err != nil {
  443. return err
  444. }
  445. if r.StatusCode == http.StatusOK {
  446. return nil
  447. }
  448. }
  449. }
  450. }(); err != nil {
  451. t.Fatal(err)
  452. }
  453. checkFileExists(t, filepath.Join(p, "blobs", "*"), []string{
  454. filepath.Join(p, "blobs", "sha256-1c515c46e60f849c6aeffa86e256508ac450464762a31ca08648e418f07c9819"),
  455. filepath.Join(p, "blobs", "sha256-461fd034bb72312965d46160399b1b882c6a2f8c7305237ed7dd65f848fba10c"),
  456. filepath.Join(p, "blobs", "sha256-66e9776a5bb7e5f6093681aa8ba01a7a6b6ae1dd697281f11fa714eaa948a6a4"),
  457. filepath.Join(p, "blobs", "sha256-a4e5e156ddec27e286f75328784d7106b60a4eb1d246e950a001a3f944fbda99"),
  458. filepath.Join(p, "blobs", "sha256-b3a5b5b438604c5103ba403a5455af94ea98494b5bbc177f4665716a37b99c1e"),
  459. filepath.Join(p, "blobs", "sha256-ca239d7bd8ea90e4a5d2e6bf88f8d74a47b14336e73eb4e18bed4dd325018116"),
  460. })
  461. }