summary | refs | log | tree | commit | diff
path: root/examples/gguf-split
diff options
context:
space:
mode:
author: Pierrick Hymbert <pierrick.hymbert@gmail.com> 2024-03-23 18:07:00 +0100
committer: GitHub <noreply@github.com> 2024-03-23 18:07:00 +0100
commit: f482bb2e4920e544651fb832f2e0bcb4d2ff69ab (patch)
tree: 9fabefd6f3b34aef6bf13a8469c7cdf363cc88cb /examples/gguf-split
parent: 1997577d5e121568ae39f538021733ccd4278c23 (diff)
common: llama_load_model_from_url split support (#6192)
* llama: llama_split_prefix fix strncpy does not include string termination
  common: llama_load_model_from_url:
   - fix header name case sensitive
   - support downloading additional split in parallel
   - hide password in url
* common: EOL EOF
* common: remove redundant LLAMA_CURL_MAX_PATH_LENGTH definition
* common: change max url max length
* common: minor comment
* server: support HF URL options
* llama: llama_model_loader fix log
* common: use a constant for max url length
* common: clean up curl if file cannot be loaded in gguf
* server: tests: add split tests, and HF options params
* common: move llama_download_hide_password_in_url inside llama_download_file as a lambda
* server: tests: enable back Release test on PR
* spacing
  Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
* spacing
  Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
* spacing
  Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
---------
Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
Diffstat (limited to 'examples/gguf-split')
-rw-r--r-- examples/gguf-split/gguf-split.cpp 4
1 files changed, 0 insertions, 4 deletions
diff --git a/examples/gguf-split/gguf-split.cpp b/examples/gguf-split/gguf-split.cpp
index f703588e..b1af5999 100644
--- a/examples/gguf-split/gguf-split.cpp
+++ b/examples/gguf-split/gguf-split.cpp
@@ -26,10 +26,6 @@ enum split_operation : uint8_t {
SPLIT_OP_MERGE,
};
-static const char * const LLM_KV_SPLIT_NO = "split.no";
-static const char * const LLM_KV_SPLIT_COUNT = "split.count";
-static const char * const LLM_KV_SPLIT_TENSORS_COUNT = "split.tensors.count";
-
struct split_params {
split_operation operation = SPLIT_OP_SPLIT;
int n_split_tensors = 128;