Michael Yang 1 年之前
父節點
當前提交
f921e2696e
共有 1 個文件被更改,包括 1 次插入和 1 次删除
  1. 1 1
      llm/llm.go

+ 1 - 1
llm/llm.go

@@ -61,7 +61,7 @@ func New(workDir, model string, adapters, projectors []string, opts api.Options)
 	requiredKv := 2 * 2 * int64(opts.NumCtx) * int64(ggml.NumLayers()) * int64(ggml.NumEmbed()) * int64(ggml.NumHeadKv()) / int64(ggml.NumHead())
 	requiredKv := 2 * 2 * int64(opts.NumCtx) * int64(ggml.NumLayers()) * int64(ggml.NumEmbed()) * int64(ggml.NumHeadKv()) / int64(ggml.NumHead())
 
 
 	// this amount is the overhead + tensors in memory
 	// this amount is the overhead + tensors in memory
-	// TODO: get this from the llama.cpp's graph calcluations instead of
+	// TODO: get this from the llama.cpp's graph calculations instead of
 	// estimating it's 1/6 * kv_cache_size * num_gqa
 	// estimating it's 1/6 * kv_cache_size * num_gqa
 	requiredAlloc := int64(ggml.NumGQA()) * requiredKv / 6
 	requiredAlloc := int64(ggml.NumGQA()) * requiredKv / 6