1 files changed, 1 insertions, 0 deletions
diff --git a/llama.h b/llama.h
index d901dcd9..6927bd60 100644
--- a/llama.h
+++ b/llama.h
@@ -191,6 +191,7 @@ extern "C" {
         bool allow_requantize;       // allow quantizing non-f32/f16 tensors
         bool quantize_output_tensor; // quantize output.weight
         bool only_copy;              // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
+        bool pure;                   // disable k-quant mixtures and quantize all tensors to the same type
     } llama_model_quantize_params;
 
     // grammar types