From 134484351584dcaad6c98ccfd1a3859cd2ca3c54 Mon Sep 17 00:00:00 2001 From: Josh Yan Date: Tue, 9 Jul 2024 10:27:33 -0700 Subject: [PATCH] image --- server/images.go | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/server/images.go b/server/images.go index 13a3192ae..c163b247c 100644 --- a/server/images.go +++ b/server/images.go @@ -440,6 +440,8 @@ func CreateModel(ctx context.Context, name model.Name, modelFileDir, quantizatio defer temp.Close() defer os.Remove(temp.Name()) + // Quantizes per layer + // Save total quantized tensors if err := llm.Quantize(blob, temp.Name(), want); err != nil { return err } @@ -480,7 +482,7 @@ func CreateModel(ctx context.Context, name model.Name, modelFileDir, quantizatio } fn(api.ProgressResponse{ - Status: fmt.Sprintf("quantizing model %d%%", 100), + Status: "quantizing model done", Quantize: quantization, }) case "license", "template", "system":