123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427 |
- package ollamarunner
- import (
- "image"
- "testing"
- "time"
- "github.com/ollama/ollama/model/input"
- )
- func TestCountCommon(t *testing.T) {
- imgA := image.NewRGBA(image.Rect(0, 0, 100, 100))
- imgB := image.NewRGBA(image.Rect(0, 0, 50, 50))
- imgC := image.NewRGBA(image.Rect(50, 50, 100, 100))
- tests := []struct {
- name string
- t1 []input.Input
- t2 []input.Input
- expected int32
- }{
- {
- name: "Equal",
- t1: []input.Input{{Token: 1}, {Token: 2}, {Token: 3}},
- t2: []input.Input{{Token: 1}, {Token: 2}, {Token: 3}},
- expected: 3,
- },
- {
- name: "Prefix",
- t1: []input.Input{{Token: 1}},
- t2: []input.Input{{Token: 1}, {Token: 2}, {Token: 3}},
- expected: 1,
- },
- {
- name: "Image Prefix",
- t1: []input.Input{{Multimodal: imgA, MultimodalHash: 1}},
- t2: []input.Input{{Multimodal: imgA, MultimodalHash: 1}, {Multimodal: imgB, MultimodalHash: 2}, {Multimodal: imgC, MultimodalHash: 3}},
- expected: 1,
- },
- {
- name: "Mixed",
- t1: []input.Input{{Token: 1}, {Multimodal: imgA, MultimodalHash: 1}},
- t2: []input.Input{{Token: 1}, {Multimodal: imgA, MultimodalHash: 1}, {Token: 5}},
- expected: 2,
- },
- {
- name: "Mixed, Same Length",
- t1: []input.Input{{Token: 1}, {Multimodal: imgA, MultimodalHash: 1}},
- t2: []input.Input{{Token: 1}, {Multimodal: imgB, MultimodalHash: 2}},
- expected: 1,
- },
- {
- name: "Empty",
- t1: []input.Input{},
- t2: []input.Input{{Token: 1}, {Token: 2}, {Token: 3}},
- expected: 0,
- },
- {
- name: "Both Empty",
- t1: []input.Input{},
- t2: []input.Input{},
- expected: 0,
- },
- }
- for _, tt := range tests {
- t.Run(tt.name, func(t *testing.T) {
- result := countCommonPrefix(tt.t1, tt.t2)
- if result != tt.expected {
- t.Errorf("countCommonPrefix(%v, %v): have %v; want %v", tt.t1, tt.t2, result, tt.expected)
- }
- })
- }
- }
- func TestFindCacheSlot(t *testing.T) {
- type expected struct {
- result int
- len int32
- }
- tests := []struct {
- name string
- cache InputCache
- prompt []input.Input
- longest expected
- best expected
- }{
- {
- name: "Empty",
- cache: InputCache{slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{},
- InUse: false,
- lastUsed: time.Time{},
- },
- {
- Id: 1,
- Inputs: []input.Input{},
- InUse: false,
- lastUsed: time.Time{},
- },
- }},
- prompt: []input.Input{{Token: 1}},
- longest: expected{result: 0, len: 0},
- best: expected{result: 0, len: 0},
- },
- {
- name: "Extend",
- cache: InputCache{slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}},
- InUse: false,
- lastUsed: time.Now().Add(-time.Second),
- },
- {
- Id: 1,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: false,
- lastUsed: time.Now().Add(-2 * time.Second),
- },
- }},
- prompt: []input.Input{{Token: 1}, {Token: 2}},
- longest: expected{result: 1, len: 2},
- best: expected{result: 1, len: 2},
- },
- {
- name: "New",
- cache: InputCache{slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: false,
- lastUsed: time.Now().Add(-time.Second),
- },
- {
- Id: 1,
- Inputs: []input.Input{},
- InUse: false,
- lastUsed: time.Time{},
- },
- }},
- prompt: []input.Input{{Token: 2}},
- longest: expected{result: 0, len: 0},
- best: expected{result: 1, len: 0},
- },
- {
- name: "Fork",
- cache: InputCache{
- slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: false,
- lastUsed: time.Now().Add(-time.Second),
- },
- {
- Id: 1,
- Inputs: []input.Input{},
- InUse: false,
- lastUsed: time.Time{},
- },
- },
- },
- prompt: []input.Input{{Token: 1}},
- longest: expected{result: 0, len: 1},
- best: expected{result: 1, len: 1},
- },
- {
- name: "Evict",
- cache: InputCache{slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}},
- InUse: false,
- lastUsed: time.Now().Add(-time.Second),
- },
- {
- Id: 1,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: false,
- lastUsed: time.Now().Add(-2 * time.Second),
- },
- }},
- prompt: []input.Input{{Token: 2}, {Token: 3}},
- longest: expected{result: 0, len: 0},
- best: expected{result: 1, len: 0},
- },
- {
- name: "In use",
- cache: InputCache{slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: true,
- lastUsed: time.Now().Add(-time.Second),
- },
- {
- Id: 1,
- Inputs: []input.Input{{Token: 1}},
- InUse: false,
- lastUsed: time.Now().Add(-2 * time.Second),
- },
- }},
- prompt: []input.Input{{Token: 1}, {Token: 2}},
- longest: expected{result: 1, len: 1},
- best: expected{result: 1, len: 2},
- },
- }
- for _, tt := range tests {
- t.Run("Longest-"+tt.name, func(t *testing.T) {
- result, resultLen, err := tt.cache.findLongestCacheSlot(tt.prompt)
- if err != nil {
- t.Errorf("findLongestCacheSlot: err %v", err)
- } else if result.Id != tt.longest.result || resultLen != tt.longest.len {
- t.Errorf("findLongestCacheSlot: slot have %v, want %v len have %v, want %v",
- result.Id, tt.longest.result, resultLen, tt.longest.len)
- }
- })
- }
- for _, tt := range tests {
- t.Run("Best-"+tt.name, func(t *testing.T) {
- result, resultLen, err := tt.cache.findBestCacheSlot(tt.prompt)
- if err != nil {
- t.Errorf("findBestCacheSlot: err %v", err)
- } else if result.Id != tt.best.result || resultLen != tt.best.len {
- t.Errorf("findBestCacheSlot: slot have %v, want %v len have %v, want %v",
- result.Id, tt.best.result, resultLen, tt.best.len)
- }
- })
- }
- }
- func TestShiftDiscard(t *testing.T) {
- tests := []struct {
- name string
- numCtx int32
- numKeep int32
- inputLen int32
- expected int32
- }{
- {
- name: "Shift",
- numCtx: 2048,
- numKeep: 5,
- inputLen: 2048,
- expected: 1021,
- },
- {
- name: "Max Keep",
- numCtx: 2048,
- numKeep: 2047,
- inputLen: 2048,
- expected: 1,
- },
- {
- name: "No Keep",
- numCtx: 2048,
- numKeep: 0,
- inputLen: 2048,
- expected: 1024,
- },
- {
- name: "Truncate",
- numCtx: 2048,
- numKeep: 5,
- inputLen: 5000,
- expected: 3973,
- },
- {
- name: "Truncate Keep",
- numCtx: 2048,
- numKeep: 2047,
- inputLen: 5000,
- expected: 2953,
- },
- {
- name: "No Op",
- numCtx: 2048,
- numKeep: 5,
- inputLen: 512,
- expected: 0,
- },
- }
- for _, tt := range tests {
- t.Run(tt.name, func(t *testing.T) {
- c := InputCache{numCtx: tt.numCtx}
- result := c.ShiftDiscard(tt.inputLen, tt.numKeep)
- if result != tt.expected {
- t.Errorf("shiftDiscard(ctx: %v, keep: %v input: %v): have %v; want %v", tt.numCtx, tt.numKeep, tt.inputLen, result, tt.expected)
- }
- })
- }
- }
- func TestLoadCacheSlot(t *testing.T) {
- tests := []struct {
- name string
- cache InputCache
- prompt []input.Input
- wantErr bool
- expectedSlotId int
- expectedPrompt int // expected length of remaining prompt
- }{
- {
- name: "Basic cache hit - single user",
- cache: InputCache{
- multiUserCache: false,
- slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: false,
- lastUsed: time.Now().Add(-time.Second),
- },
- {
- Id: 1,
- Inputs: []input.Input{},
- InUse: false,
- lastUsed: time.Now().Add(-2 * time.Second),
- },
- },
- },
- prompt: []input.Input{{Token: 1}, {Token: 2}, {Token: 3}},
- wantErr: false,
- expectedSlotId: 0,
- expectedPrompt: 1, // Only token 3 remains
- },
- {
- name: "Basic cache hit - multi user",
- cache: InputCache{
- multiUserCache: true,
- slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: false,
- lastUsed: time.Now().Add(-time.Second),
- },
- {
- Id: 1,
- Inputs: []input.Input{},
- InUse: false,
- lastUsed: time.Now().Add(-2 * time.Second),
- },
- },
- },
- prompt: []input.Input{{Token: 1}, {Token: 2}, {Token: 3}},
- wantErr: false,
- expectedSlotId: 0,
- expectedPrompt: 1, // Only token 3 remains
- },
- {
- name: "Exact match - leave one input",
- cache: InputCache{
- multiUserCache: false,
- slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: false,
- lastUsed: time.Now().Add(-time.Second),
- },
- },
- },
- prompt: []input.Input{{Token: 1}, {Token: 2}},
- wantErr: false,
- expectedSlotId: 0,
- expectedPrompt: 1, // Should leave 1 token for sampling
- },
- {
- name: "No available slots",
- cache: InputCache{
- multiUserCache: false,
- slots: []InputCacheSlot{
- {
- Id: 0,
- Inputs: []input.Input{{Token: 1}, {Token: 2}},
- InUse: true,
- lastUsed: time.Now().Add(-time.Second),
- },
- },
- },
- prompt: []input.Input{{Token: 1}, {Token: 2}, {Token: 3}},
- wantErr: true,
- expectedSlotId: -1,
- expectedPrompt: -1,
- },
- }
- for _, tt := range tests {
- t.Run(tt.name, func(t *testing.T) {
- slot, remainingPrompt, err := tt.cache.LoadCacheSlot(tt.prompt)
- // Check error state
- if (err != nil) != tt.wantErr {
- t.Errorf("LoadCacheSlot() error = %v, wantErr %v", err, tt.wantErr)
- return
- }
- if tt.wantErr {
- return // Skip further checks if we expected an error
- }
- // Verify slot ID
- if slot.Id != tt.expectedSlotId {
- t.Errorf("LoadCacheSlot() slot ID = %v, expected %v", slot.Id, tt.expectedSlotId)
- }
- // Verify slot is now marked in use
- if !slot.InUse {
- t.Errorf("LoadCacheSlot() slot not marked InUse")
- }
- // Verify remaining prompt length
- if len(remainingPrompt) != tt.expectedPrompt {
- t.Errorf("LoadCacheSlot() remaining prompt length = %v, expected %v",
- len(remainingPrompt), tt.expectedPrompt)
- }
- })
- }
- }
|