diff options
author | Alexey Parfenov <zxed@alkatrazstudio.net> | 2024-02-05 08:10:22 +0000 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-02-05 10:10:22 +0200 |
commit | a2d60c9158435ae9a6f14632f07f1acf7a3becef (patch) | |
tree | 1466e6a9bfc6ddc1810e0580eb404aa54de537e4 /examples/server/server.cpp | |
parent | e6f81775323f6f4e4a30abf022a6028fa86b79ac (diff) |
server : allow to get default generation settings for completion (#5307)
Diffstat (limited to 'examples/server/server.cpp')
-rw-r--r-- | examples/server/server.cpp | 7 |
1 file changed, 6 insertions, 1 deletion
```diff
diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index a9f8cb36..8000fee5 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -334,6 +334,7 @@ struct llama_server_context
 
     // slots / clients
     std::vector<llama_client_slot> slots;
+    json default_generation_settings_for_props;
 
     llama_server_queue queue_tasks;
     llama_server_response queue_results;
@@ -430,6 +431,9 @@ struct llama_server_context
             slots.push_back(slot);
         }
 
+        default_generation_settings_for_props = get_formated_generation(slots.front());
+        default_generation_settings_for_props["seed"] = -1;
+
         batch = llama_batch_init(n_ctx, 0, params.n_parallel);
 
         // empty system prompt
@@ -2614,7 +2618,8 @@ int main(int argc, char **argv)
                 res.set_header("Access-Control-Allow-Origin", req.get_header_value("Origin"));
                 json data = {
                     { "user_name", llama.name_user.c_str() },
-                    { "assistant_name", llama.name_assistant.c_str() }
+                    { "assistant_name", llama.name_assistant.c_str() },
+                    { "default_generation_settings", llama.default_generation_settings_for_props }
                 };
                 res.set_content(data.dump(), "application/json; charset=utf-8");
             });
```