diff --git a/include/llama.h b/include/llama.h index b17e8f3353..f44e2383d0 100644 --- a/include/llama.h +++ b/include/llama.h @@ -358,6 +358,7 @@ extern "C" { void * kv_overrides; // pointer to vector containing overrides void * tensor_types; // pointer to vector containing tensor types void * prune_layers; // pointer to vector containing layer indices to prune + float target_bpw; // target bits per weight (bpw) } llama_model_quantize_params; typedef struct llama_logit_bias {