Michael Yang преди 4 месеца
родител
ревизия
cef3cf353a
променени са 2 файла, в които са добавени 4 реда и са изтрити 4 реда
  1. 3 3
      llm/memory.go
  2. 1 1
      llm/server.go

+ 3 - 3
llm/memory.go

@@ -338,7 +338,7 @@ func EstimateGPULayers(gpus []discover.GpuInfo, f *ggml.GGML, projectors []strin
 	return estimate
 }
 
-func (m MemoryEstimate) log() {
+func (m MemoryEstimate) LogValue() slog.Value {
 	overhead := envconfig.GpuOverhead()
 
 	log := slog.With()
@@ -352,8 +352,8 @@ func (m MemoryEstimate) log() {
 		)
 	}
 
-	log.Info(
-		"offload to "+m.inferenceLibrary,
+	return slog.GroupValue(
+		slog.String("library", m.inferenceLibrary),
 		slog.Group(
 			"layers",
 			// requested number of layers to offload

+ 1 - 1
llm/server.go

@@ -139,7 +139,7 @@ func NewLlamaServer(gpus discover.GpuInfoList, model string, f *ggml.GGML, adapt
 		}
 	}
 
-	estimate.log()
+	slog.Info("offload", "", estimate)
 
 	// Loop through potential servers
 	finalErr := errors.New("no suitable llama servers found")