fix: store format_infill() result in data["prompts"] when creating server infill tasks

ggml-org · ngxson · Dec 8, 2024 · Dec 8, 2024 · Dec 8, 2024 · Dec 8, 2024
commit 6ec3f77a4181cbe2dcad7994e15f315ec10c9019
diff --git a/examples/server/server.cpp b/examples/server/server.cpp
@@ -3519,7 +3519,7 @@ int main(int argc, char ** argv) {
         std::string prompt = json_value(data, "prompt", std::string());
         std::vector<llama_tokens> tokenized_prompts = tokenize_input_prompts(ctx_server.ctx, prompt, true, true);
         SRV_DBG("creating infill tasks, n_prompts = %d\n", (int) tokenized_prompts.size());
-        auto tokens = format_infill(
+        data["prompts"] = format_infill(
             ctx_server.ctx,
             data.at("input_prefix"),
             data.at("input_suffix"),