From d25b1c31b07c3675443a55a828dd58cfef5a241c Mon Sep 17 00:00:00 2001
From: Kawrakow <48489457+ikawrakow@users.noreply.github.com>
Date: Tue, 26 Mar 2024 13:09:30 +0100
Subject: quantize : be able to override metadata by key (#6321)

* quantize: be able to override metadata by key

* minor : spacing

---------

Co-authored-by: Iwan Kawrakow
Co-authored-by: Georgi Gerganov
---
 llama.h | 1 +
 1 file changed, 1 insertion(+)

(limited to 'llama.h')

diff --git a/llama.h b/llama.h
index 74f0e56d..6daf3a35 100644
--- a/llama.h
+++ b/llama.h
@@ -284,6 +284,7 @@ extern "C" {
         bool only_copy;                      // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
         bool pure;                           // quantize all tensors to the default type
         void * imatrix;                      // pointer to importance matrix data
+        void * kv_overrides;                 // pointer to vector containing overrides
     } llama_model_quantize_params;
 
     // grammar types
-- 
cgit v1.2.3