From b0e4e8d76c7c3cc61462a53b78d93f96077991ba Mon Sep 17 00:00:00 2001
From: Josh Yan <jyan00017@gmail.com>
Date: Wed, 10 Jul 2024 09:58:30 -0700
Subject: [PATCH] llm: report quantize progress as tensor count instead of percent

---
 llm/llm.go       | 4 ++--
 server/images.go | 3 ++-
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/llm/llm.go b/llm/llm.go
index 1008ee200..38b2aa13a 100644
--- a/llm/llm.go
+++ b/llm/llm.go
@@ -28,7 +28,7 @@ func SystemInfo() string {
 	return C.GoString(C.llama_print_system_info())
 }
 
-func Quantize(infile, outfile string, ftype fileType, fn func(resp api.ProgressResponse) ) error {
+func Quantize(infile, outfile string, ftype fileType, fn func(resp api.ProgressResponse), tensorCount int) error {
 	cinfile := C.CString(infile)
 	defer C.free(unsafe.Pointer(cinfile))
 
@@ -59,7 +59,7 @@ func Quantize(infile, outfile string, ftype fileType, fn func(resp api.ProgressR
 			select {
 			case <-ticker.C:
                 fn(api.ProgressResponse{
-                    Status:   fmt.Sprintf("quantizing model %d%%", int(*((*C.float)(store))*100)),
+                    Status:   fmt.Sprintf("quantizing model %d/%d", int(*((*C.float)(store))), tensorCount),
                     Quantize: "quant",
                 })			
 				fmt.Println("Progress: ", *((*C.float)(store)))
diff --git a/server/images.go b/server/images.go
index 4accb464c..65fe30725 100644
--- a/server/images.go
+++ b/server/images.go
@@ -422,6 +422,7 @@ func CreateModel(ctx context.Context, name model.Name, modelFileDir, quantizatio
 					if err != nil {
 						return err
 					}
+					tensorCount := len(baseLayer.GGML.Tensors())
 					
 					ft := baseLayer.GGML.KV().FileType()
 					if !slices.Contains([]string{"F16", "F32"}, ft.String()) {
@@ -441,7 +442,7 @@ func CreateModel(ctx context.Context, name model.Name, modelFileDir, quantizatio
 
 						// Quantizes per layer
 						// Save total quantized tensors
-						if err := llm.Quantize(blob, temp.Name(), want, fn); err != nil {
+						if err := llm.Quantize(blob, temp.Name(), want, fn, tensorCount); err != nil {
 							return err
 						}