From 512e0a7bdea6292675b0658ad59a7761d74153c3 Mon Sep 17 00:00:00 2001 From: Roy Han Date: Mon, 1 Jul 2024 16:29:54 -0700 Subject: [PATCH] Clean up --- llm/ext_server/server.cpp | 5 ----- llm/ext_server/utils.hpp | 17 ----------------- server/routes.go | 11 ----------- 3 files changed, 33 deletions(-) diff --git a/llm/ext_server/server.cpp b/llm/ext_server/server.cpp index cb0463919..8166af2bc 100644 --- a/llm/ext_server/server.cpp +++ b/llm/ext_server/server.cpp @@ -1206,7 +1206,6 @@ struct llama_server_context res.result_json = json { {"embedding", std::vector(n_embd, 0.0f)}, - {"truncated", slot.truncated} }; } else @@ -1224,7 +1223,6 @@ struct llama_server_context res.result_json = json { {"embedding", std::vector(n_embd, 0.0f)}, - {"truncated", slot.truncated} }; continue; } @@ -1233,7 +1231,6 @@ struct llama_server_context res.result_json = json { {"embedding", std::vector(embd, embd + n_embd)}, - {"truncated", slot.truncated} }; } } @@ -3063,7 +3060,6 @@ int main(int argc, char **argv) { if (!json_value(data, "stream", false)) { std::string completion_text; task_result result = llama.queue_results.recv(task_id); - LOG_INFO("completion", {{"result", result.result_json}}); if (!result.error && result.stop) { res.set_content(result.result_json.dump(-1, ' ', false, json::error_handler_t::replace), "application/json; charset=utf-8"); } @@ -3079,7 +3075,6 @@ int main(int argc, char **argv) { while (true) { task_result result = llama.queue_results.recv(task_id); - LOG_INFO("completion", {{"result", result.result_json}}); if (!result.error) { const std::string str = "data: " + diff --git a/llm/ext_server/utils.hpp b/llm/ext_server/utils.hpp index 3e54d0c0e..d63ead04c 100644 --- a/llm/ext_server/utils.hpp +++ b/llm/ext_server/utils.hpp @@ -656,20 +656,3 @@ static json probs_vector_to_json(const llama_context *ctx, const std::vector normalize_vector(const std::vector& vec, int size) { -// double sum = 0.0; -// for (float value : vec) { -// sum += value * value; -// } -// sum = std::sqrt(sum); - -// const float norm = sum > 0.0 ? 1.0f / sum : 0.0f; - -// std::vector normalized_vec(size); -// for (int i = 0; i < size; i++) { -// normalized_vec[i] = vec[i] * norm; -// } -// return normalized_vec; -// } diff --git a/server/routes.go b/server/routes.go index 90aeb3ba0..bd32c5faa 100644 --- a/server/routes.go +++ b/server/routes.go @@ -533,17 +533,6 @@ func (s *Server) EmbeddingsHandler(c *gin.Context) { return } - // assert that embedding is normalized - sum := 0.0 - for _, v := range embedding { - sum += v * v - } - if math.Abs(sum-1) < 1e-6 { - slog.Info("embedding is normalized", "sum", sum) - } else { - slog.Info("embedding is not normalized", "sum", sum) - } - resp := api.EmbeddingResponse{ Embedding: embedding, }