9 месяцев назад · 369113970a
--- a/llm/llm.go
+++ b/llm/llm.go
@@ -63,6 +63,7 @@ func Quantize(infile, outfile string, ftype fileType, fn func(resp api.ProgressR
 
															                     Status:   fmt.Sprintf("quantizing model %d%%", int(progress*100)),
														
 
															                     Quantize: "quant",
														
 
															                 })			
														
 
															+				fmt.Println("Progress: ", progress)
														
 
															 			case <-done:
														
 
															                 fn(api.ProgressResponse{
														
 
															                     Status:  "quantizing model",
														
--- a/server/images.go
+++ b/server/images.go
@@ -422,12 +422,7 @@ func CreateModel(ctx context.Context, name model.Name, modelFileDir, quantizatio
 
															 					if err != nil {
														
 
															 						return err
														
 
															 					}
														
 
															-
														
 
															-					fn(api.ProgressResponse{
														
 
															-						Status:   "quantizing model",
														
 
															-						Quantize: "quant",
														
 
															-					})
														
 
															-
														
 
															+					
														
 
															 					ft := baseLayer.GGML.KV().FileType()
														
 
															 					if !slices.Contains([]string{"F16", "F32"}, ft.String()) {
														
 
															 						return errors.New("quantization is only supported for F16 and F32 models")
														
@@ -467,11 +462,6 @@ func CreateModel(ctx context.Context, name model.Name, modelFileDir, quantizatio
 
															 						baseLayer.Layer = layer
														
 
															 						baseLayer.GGML = ggml
														
 
															 					}
														
 
															-
														
 
															-					fn(api.ProgressResponse{
														
 
															-						Status:   "quantizing model done",
														
 
															-						Quantize: quantization,
														
 
															-					})
														
 
															 				}
														
 
															 				if baseLayer.GGML != nil {