From 25d7ecc42aab1bdb25cf4f8b1e078f2549c550d6 Mon Sep 17 00:00:00 2001 From: Ed Addario Date: Wed, 21 Jan 2026 18:26:58 +0000 Subject: [PATCH] Add statistics pointer and use_wce option --- include/llama.h | 2 ++ 1 file changed, 2 insertions(+) diff --git a/include/llama.h b/include/llama.h index 864d7043a1..6a930004e7 100644 --- a/include/llama.h +++ b/include/llama.h @@ -391,6 +391,7 @@ extern "C" { bool keep_split; // quantize to the same number of shards void * imatrix; // pointer to importance matrix data void * activations; // pointer to activations data + void * statistics; // pointer to statistics data void * kv_overrides; // pointer to vector containing overrides void * tensor_types; // pointer to vector containing tensor types void * prune_layers; // pointer to vector containing layer indices to prune @@ -399,6 +400,7 @@ extern "C" { bool save_state; // keep bpw state file void * state_file; // pointer to bpw state file bool ignore_tensor_importance; // allocate target bpw budget equitably across all tensors + bool use_wce; // optimize for WCE instead of MSE } llama_model_quantize_params; typedef struct llama_logit_bias {