summary | refs | log | tree | commit | diff
path: root/llama.h
diff options
context:
space:
mode:
author: Kawrakow <48489457+ikawrakow@users.noreply.github.com> 2024-03-26 13:09:30 +0100
committer: GitHub <noreply@github.com> 2024-03-26 14:09:30 +0200
commit: d25b1c31b07c3675443a55a828dd58cfef5a241c (patch)
tree: 3ea7b6c04accf513b7493a893cd95ae42e760e4b /llama.h
parent: deb7240100da99555b9ab9dc635021e591fceaf5 (diff)
quantize : be able to override metadata by key (#6321)
* quantize: be able to override metadata by key

* minor : spacing

---------

Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
Diffstat (limited to 'llama.h')
-rw-r--r-- llama.h 1
1 file changed, 1 insertion, 0 deletions
diff --git a/llama.h b/llama.h
index 74f0e56d..6daf3a35 100644
--- a/llama.h
+++ b/llama.h
@@ -284,6 +284,7 @@ extern "C" {
bool only_copy; // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
bool pure; // quantize all tensors to the default type
void * imatrix; // pointer to importance matrix data
+ void * kv_overrides; // pointer to vector containing overrides
} llama_model_quantize_params;
// grammar types