diff options
author | Justin Parker <jparkerweb@gmail.com> | 2024-02-07 01:15:19 -0500 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-02-07 08:15:19 +0200 |
commit | f3e2b4fa3f81a410ecb7dec929c259ef8d8dbb7d (patch) | |
tree | 77bda53ac299ccac3ee35e91e5571d57485b63a4 /examples/server/server.cpp | |
parent | f68664ac241a6b5c233d8f1051eef20929b06008 (diff) |
server : update `/props` with "total_slots" value (#5373)
* include total "num_slots" in default_generation_settings_for_props
* cleanup total_slots return value in /props endpoint
* update /props endpoint docs with total_slots
* remove num_slots from default_generation_settings_for_props
* update /props endpoint section
Diffstat (limited to 'examples/server/server.cpp')
-rw-r--r-- | examples/server/server.cpp | 4 |
1 file changed, 2 insertions, 2 deletions
diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index 9481ce6b..eceda30d 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -432,7 +432,6 @@ struct llama_server_context
         }
 
         default_generation_settings_for_props = get_formated_generation(slots.front());
-        default_generation_settings_for_props["num_slots"] = params.n_parallel;
         default_generation_settings_for_props["seed"] = -1;
 
         batch = llama_batch_init(n_ctx, 0, params.n_parallel);
@@ -2639,7 +2638,8 @@ int main(int argc, char **argv)
                 json data = {
                     { "user_name", llama.name_user.c_str() },
                     { "assistant_name", llama.name_assistant.c_str() },
-                    { "default_generation_settings", llama.default_generation_settings_for_props }
+                    { "default_generation_settings", llama.default_generation_settings_for_props },
+                    { "total_slots", llama.params.n_parallel }
                 };
                 res.set_content(data.dump(), "application/json; charset=utf-8");
             });