Josh Yan 8 mēneši atpakaļ
vecāks
revīzija
cc17b02b23
3 mainīti faili ar 3 papildinājumiem un 1 dzēšanu
  1. 1 0
      .gitattributes
  2. 1 0
      llm/llm.go
  3. 1 1
      server/images.go

+ 1 - 0
.gitattributes

@@ -1,3 +1,4 @@
 llm/ext_server/* linguist-vendored
+llm/*.h linguist-vendored
 * text=auto
 *.go text eol=lf

+ 1 - 0
llm/llm.go

@@ -20,6 +20,7 @@ package llm
 import "C"
 
 import (
+	"errors"
 	"fmt"
 	"sync/atomic"
 	"time"

+ 1 - 1
server/images.go

@@ -435,7 +435,7 @@ func CreateModel(ctx context.Context, name model.Name, modelFileDir, quantizatio
 						return err
 					}
 
-					tensorCount := len(baseLayer.GGML.Tensors())
+					tensorCount := len(baseLayer.GGML.Tensors().Items)
 					ft := baseLayer.GGML.KV().FileType()
 					if !slices.Contains([]string{"F16", "F32"}, ft.String()) {
 						return errors.New("quantization is only supported for F16 and F32 models")