summaryrefslogtreecommitdiff
path: root/ggml-rpc.cpp
diff options
context:
space:
mode:
author: Radoslav Gerganov <rgerganov@gmail.com> 2024-06-03 20:03:26 +0300
committer: GitHub <noreply@github.com> 2024-06-03 20:03:26 +0300
commit: bde7cd3cd949c1a85d3a199498ac98e78039d46f (patch)
tree: 738364c20669cea19d3ca5df2baec036429b9b40 /ggml-rpc.cpp
parent: a5735e4426b19a3ebd0c653ad8ac01420458ee95 (diff)
llama : offload to RPC in addition to other backends (#7640)
* llama : offload to RPC in addition to other backends
* - fix copy_tensor being called on the src buffer instead of the dst buffer
  - always initialize views in the view_src buffer
  - add RPC backend to Makefile build
  - add endpoint to all RPC object names
* add rpc-server to Makefile
* Update llama.cpp

Co-authored-by: slaren <slarengh@gmail.com>

---------

Co-authored-by: slaren <slarengh@gmail.com>
Diffstat (limited to 'ggml-rpc.cpp')
-rw-r--r-- ggml-rpc.cpp 4
1 files changed, 2 insertions, 2 deletions
diff --git a/ggml-rpc.cpp b/ggml-rpc.cpp
index 49a20df4..679ce4f2 100644
--- a/ggml-rpc.cpp
+++ b/ggml-rpc.cpp
@@ -491,7 +491,7 @@ GGML_CALL static ggml_backend_buffer_t ggml_backend_rpc_buffer_type_alloc_buffer
if (remote_ptr != 0) {
ggml_backend_buffer_t buffer = ggml_backend_buffer_init(buft,
ggml_backend_rpc_buffer_interface,
- new ggml_backend_rpc_buffer_context{sock, {}, remote_ptr, "RPC"},
+ new ggml_backend_rpc_buffer_context{sock, {}, remote_ptr, "RPC[" + std::string(buft_ctx->endpoint) + "]"},
remote_size);
return buffer;
} else {
@@ -692,7 +692,7 @@ GGML_API GGML_CALL ggml_backend_buffer_type_t ggml_backend_rpc_buffer_type(const
GGML_CALL ggml_backend_t ggml_backend_rpc_init(const char * endpoint) {
ggml_backend_rpc_context * ctx = new ggml_backend_rpc_context {
/* .endpoint = */ endpoint,
- /* .name = */ "RPC",
+ /* .name = */ "RPC[" + std::string(endpoint) + "]",
};
ggml_backend_t backend = new ggml_backend {