summary | refs | log | tree | commit | diff
path: root/examples/server/server.cpp
diff options
context:
space:
mode:
author: Justin Parker <jparkerweb@gmail.com> 2024-02-07 01:15:19 -0500
committer: GitHub <noreply@github.com> 2024-02-07 08:15:19 +0200
commit: f3e2b4fa3f81a410ecb7dec929c259ef8d8dbb7d (patch)
tree: 77bda53ac299ccac3ee35e91e5571d57485b63a4 /examples/server/server.cpp
parent: f68664ac241a6b5c233d8f1051eef20929b06008 (diff)
server : update `/props` with "total_slots" value (#5373)
* include total "num_slots" in default_generation_settings_for_props
* cleanup total_slots return value in /props endpoint
* update /props endpoint docs with total_slots
* remove num_slots from default_generation_settings_for_props
* update /props endpoint section
Diffstat (limited to 'examples/server/server.cpp')
-rw-r--r-- examples/server/server.cpp 4
1 files changed, 2 insertions, 2 deletions
diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index 9481ce6b..eceda30d 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -432,7 +432,6 @@ struct llama_server_context
}
default_generation_settings_for_props = get_formated_generation(slots.front());
- default_generation_settings_for_props["num_slots"] = params.n_parallel;
default_generation_settings_for_props["seed"] = -1;
batch = llama_batch_init(n_ctx, 0, params.n_parallel);
@@ -2639,7 +2638,8 @@ int main(int argc, char **argv)
json data = {
{ "user_name", llama.name_user.c_str() },
{ "assistant_name", llama.name_assistant.c_str() },
- { "default_generation_settings", llama.default_generation_settings_for_props }
+ { "default_generation_settings", llama.default_generation_settings_for_props },
+ { "total_slots", llama.params.n_parallel }
};
res.set_content(data.dump(), "application/json; charset=utf-8");
});