Parcourir la source

Merge pull request #3466 from ollama/mxyng/head-kv

default head_kv to 1
Michael Yang il y a 1 an
Parent
commit
4f895d633f
1 fichier modifié avec 6 ajouts et 6 suppressions
  1. 6 6
      llm/ggml.go

+ 6 - 6
llm/ggml.go

@@ -148,15 +148,15 @@ func (kv KV) HeadCount() uint64 {
 }
 
 func (kv KV) HeadCountKV() uint64 {
-	return kv.u64(fmt.Sprintf("%s.attention.head_count_kv", kv.Architecture()))
+	if headCountKV := kv.u64(fmt.Sprintf("%s.attention.head_count_kv", kv.Architecture())); headCountKV > 0 {
+		return headCountKV
+	}
+
+	return 1
 }
 
 func (kv KV) GQA() uint64 {
-	if headCountKV := kv.HeadCountKV(); headCountKV > 0 {
-		return kv.HeadCount() / headCountKV
-	}
-
-	return 0
+	return kv.HeadCount() / kv.HeadCountKV()
 }
 
 func (kv KV) EmbeddingLength() uint64 {