Move test-only stuff out of llama-quant.cpp

2026-03-12 14:06:23 -04:00 · 2026-03-12 14:06:23 -04:00 · 8ebfe03f95
parent 3fe55f1035
commit 8ebfe03f95
3 changed files with 63 additions and 63 deletions
--- a/src/llama-quant.cpp
+++ b/src/llama-quant.cpp
@ -755,64 +755,6 @@ ggml_type llama_ftype_get_default_type(llama_ftype ftype) {
    }
 }
 // One row of the ftype name table: pairs a short textual name with the
 // llama_ftype enum value it stands for. Field order matters because the table
 // below uses positional aggregate initializers ({ name, ftype }).
 struct ftype_name_entry {
    const char * name;   // short name string, e.g. "Q4_K_M"
    llama_ftype  ftype;  // enum value associated with `name`
 };
 // Name <-> llama_ftype table shared by llama_ftype_from_name and
 // llama_ftype_to_name. Each name is the enumerator with its
 // LLAMA_FTYPE_MOSTLY_ / LLAMA_FTYPE_ALL_ prefix dropped. Both lookups scan the
 // rows in order and return the first match, so names and ftype values should
 // stay unique within the table.
 static const ftype_name_entry ftype_name_table[] = {
    { "F32",        LLAMA_FTYPE_ALL_F32 },
    { "F16",        LLAMA_FTYPE_MOSTLY_F16 },
    { "BF16",       LLAMA_FTYPE_MOSTLY_BF16 },
    { "Q4_0",       LLAMA_FTYPE_MOSTLY_Q4_0 },
    { "Q4_1",       LLAMA_FTYPE_MOSTLY_Q4_1 },
    { "Q5_0",       LLAMA_FTYPE_MOSTLY_Q5_0 },
    { "Q5_1",       LLAMA_FTYPE_MOSTLY_Q5_1 },
    { "Q8_0",       LLAMA_FTYPE_MOSTLY_Q8_0 },
    { "Q2_K",       LLAMA_FTYPE_MOSTLY_Q2_K },
    { "Q2_K_S",     LLAMA_FTYPE_MOSTLY_Q2_K_S },
    { "Q3_K_S",     LLAMA_FTYPE_MOSTLY_Q3_K_S },
    { "Q3_K_M",     LLAMA_FTYPE_MOSTLY_Q3_K_M },
    { "Q3_K_L",     LLAMA_FTYPE_MOSTLY_Q3_K_L },
    { "Q4_K_S",     LLAMA_FTYPE_MOSTLY_Q4_K_S },
    { "Q4_K_M",     LLAMA_FTYPE_MOSTLY_Q4_K_M },
    { "Q5_K_S",     LLAMA_FTYPE_MOSTLY_Q5_K_S },
    { "Q5_K_M",     LLAMA_FTYPE_MOSTLY_Q5_K_M },
    { "Q6_K",       LLAMA_FTYPE_MOSTLY_Q6_K },
    { "IQ1_S",      LLAMA_FTYPE_MOSTLY_IQ1_S },
    { "IQ1_M",      LLAMA_FTYPE_MOSTLY_IQ1_M },
    { "IQ2_XXS",    LLAMA_FTYPE_MOSTLY_IQ2_XXS },
    { "IQ2_XS",     LLAMA_FTYPE_MOSTLY_IQ2_XS },
    { "IQ2_S",      LLAMA_FTYPE_MOSTLY_IQ2_S },
    { "IQ2_M",      LLAMA_FTYPE_MOSTLY_IQ2_M },
    { "IQ3_XXS",    LLAMA_FTYPE_MOSTLY_IQ3_XXS },
    { "IQ3_XS",     LLAMA_FTYPE_MOSTLY_IQ3_XS },
    { "IQ3_S",      LLAMA_FTYPE_MOSTLY_IQ3_S },
    { "IQ3_M",      LLAMA_FTYPE_MOSTLY_IQ3_M },
    { "IQ4_NL",     LLAMA_FTYPE_MOSTLY_IQ4_NL },
    { "IQ4_XS",     LLAMA_FTYPE_MOSTLY_IQ4_XS },
    { "TQ1_0",      LLAMA_FTYPE_MOSTLY_TQ1_0 },
    { "TQ2_0",      LLAMA_FTYPE_MOSTLY_TQ2_0 },
    { "MXFP4_MOE",  LLAMA_FTYPE_MOSTLY_MXFP4_MOE },
 };
 // Convert a textual ftype name (e.g. "Q4_K_M") to its llama_ftype value.
 //
 // name: NUL-terminated string compared exactly (case-sensitive) against the
 //       names in ftype_name_table; may be null.
 // Returns the matching enum value, or (llama_ftype)-1 when `name` is null or
 // does not appear in the table.
 llama_ftype llama_ftype_from_name(const char * name) {
    // Same sentinel value as the original (llama_ftype)-1, spelled as a named cast.
    const llama_ftype not_found = static_cast<llama_ftype>(-1);

    // strcmp on a null pointer is undefined behavior; treat null as "no match".
    if (name == nullptr) {
        return not_found;
    }

    for (const auto & entry : ftype_name_table) {
        if (strcmp(name, entry.name) == 0) {
            return entry.ftype;
        }
    }
    return not_found;
 }
 // Reverse lookup: find the table name registered for `ftype`.
 // Returns the name string of the first row whose ftype equals the argument,
 // or nullptr when no row matches.
 const char * llama_ftype_to_name(llama_ftype ftype) {
    const ftype_name_entry * const table_end =
        ftype_name_table + sizeof(ftype_name_table) / sizeof(ftype_name_table[0]);

    for (const ftype_name_entry * row = ftype_name_table; row != table_end; ++row) {
        if (row->ftype != ftype) {
            continue;  // not this row, keep scanning
        }
        return row->name;
    }
    return nullptr;
 }
 void init_quantize_state_counters(quantize_state_impl & qs, std::vector<tensor_metadata> & metadata) {
    for (auto & tm : metadata) {
--- a/src/llama-quant.h
+++ b/src/llama-quant.h
@ -86,11 +86,6 @@ struct quantize_state_impl {
 ggml_type llama_tensor_get_type(quantize_state_impl & qs, const llama_model_quantize_params * params, const ggml_tensor * tensor, ggml_type default_type, const tensor_metadata & tm);
 ggml_type llama_ftype_get_default_type(llama_ftype ftype);
 // Ftype name <-> enum conversions.
 // llama_ftype_from_name returns (llama_ftype)-1 when the name is not recognized.
 // llama_ftype_to_name returns nullptr when the ftype has no name entry.
 llama_ftype  llama_ftype_from_name(const char * name);
 const char * llama_ftype_to_name(llama_ftype ftype);
 // Initialize quantize_state_impl counters and populate tensor_metadata categories.
 // metadata: vector with name fields already set, will have category field populated.
 void init_quantize_state_counters(quantize_state_impl & qs, std::vector<tensor_metadata> & metadata);
--- a/tests/test-quant-type-selection.cpp
+++ b/tests/test-quant-type-selection.cpp
@ -16,6 +16,69 @@
 #include <utility>
 #include <vector>
 // ---------------------------------------------------------------------------
 // ftype name <-> enum mapping
 // ---------------------------------------------------------------------------
 // One row of the ftype name table: pairs a short textual name with the
 // llama_ftype enum value it stands for. Field order matters because the table
 // below uses positional aggregate initializers ({ name, ftype }).
 struct ftype_name_entry {
    const char * name;   // short name string, e.g. "Q4_K_M"
    llama_ftype  ftype;  // enum value associated with `name`
 };
 // Name <-> llama_ftype table used by the test-local llama_ftype_from_name and
 // llama_ftype_to_name helpers. Each name is the enumerator with its
 // LLAMA_FTYPE_MOSTLY_ / LLAMA_FTYPE_ALL_ prefix dropped. Both lookups scan the
 // rows in order and return the first match, so names and ftype values should
 // stay unique within the table.
 static const ftype_name_entry ftype_name_table[] = {
    { "F32",        LLAMA_FTYPE_ALL_F32 },
    { "F16",        LLAMA_FTYPE_MOSTLY_F16 },
    { "BF16",       LLAMA_FTYPE_MOSTLY_BF16 },
    { "Q4_0",       LLAMA_FTYPE_MOSTLY_Q4_0 },
    { "Q4_1",       LLAMA_FTYPE_MOSTLY_Q4_1 },
    { "Q5_0",       LLAMA_FTYPE_MOSTLY_Q5_0 },
    { "Q5_1",       LLAMA_FTYPE_MOSTLY_Q5_1 },
    { "Q8_0",       LLAMA_FTYPE_MOSTLY_Q8_0 },
    { "Q2_K",       LLAMA_FTYPE_MOSTLY_Q2_K },
    { "Q2_K_S",     LLAMA_FTYPE_MOSTLY_Q2_K_S },
    { "Q3_K_S",     LLAMA_FTYPE_MOSTLY_Q3_K_S },
    { "Q3_K_M",     LLAMA_FTYPE_MOSTLY_Q3_K_M },
    { "Q3_K_L",     LLAMA_FTYPE_MOSTLY_Q3_K_L },
    { "Q4_K_S",     LLAMA_FTYPE_MOSTLY_Q4_K_S },
    { "Q4_K_M",     LLAMA_FTYPE_MOSTLY_Q4_K_M },
    { "Q5_K_S",     LLAMA_FTYPE_MOSTLY_Q5_K_S },
    { "Q5_K_M",     LLAMA_FTYPE_MOSTLY_Q5_K_M },
    { "Q6_K",       LLAMA_FTYPE_MOSTLY_Q6_K },
    { "IQ1_S",      LLAMA_FTYPE_MOSTLY_IQ1_S },
    { "IQ1_M",      LLAMA_FTYPE_MOSTLY_IQ1_M },
    { "IQ2_XXS",    LLAMA_FTYPE_MOSTLY_IQ2_XXS },
    { "IQ2_XS",     LLAMA_FTYPE_MOSTLY_IQ2_XS },
    { "IQ2_S",      LLAMA_FTYPE_MOSTLY_IQ2_S },
    { "IQ2_M",      LLAMA_FTYPE_MOSTLY_IQ2_M },
    { "IQ3_XXS",    LLAMA_FTYPE_MOSTLY_IQ3_XXS },
    { "IQ3_XS",     LLAMA_FTYPE_MOSTLY_IQ3_XS },
    { "IQ3_S",      LLAMA_FTYPE_MOSTLY_IQ3_S },
    { "IQ3_M",      LLAMA_FTYPE_MOSTLY_IQ3_M },
    { "IQ4_NL",     LLAMA_FTYPE_MOSTLY_IQ4_NL },
    { "IQ4_XS",     LLAMA_FTYPE_MOSTLY_IQ4_XS },
    { "TQ1_0",      LLAMA_FTYPE_MOSTLY_TQ1_0 },
    { "TQ2_0",      LLAMA_FTYPE_MOSTLY_TQ2_0 },
    { "MXFP4_MOE",  LLAMA_FTYPE_MOSTLY_MXFP4_MOE },
 };
 // Test-local helper: convert a textual ftype name (e.g. "Q4_K_M") to its
 // llama_ftype value.
 //
 // name: NUL-terminated string compared exactly (case-sensitive) against the
 //       names in ftype_name_table; may be null.
 // Returns the matching enum value, or (llama_ftype)-1 when `name` is null or
 // does not appear in the table.
 static llama_ftype llama_ftype_from_name(const char * name) {
    // Same sentinel value as the original (llama_ftype)-1, spelled as a named cast.
    const llama_ftype not_found = static_cast<llama_ftype>(-1);

    // strcmp on a null pointer is undefined behavior; treat null as "no match".
    if (name == nullptr) {
        return not_found;
    }

    for (const auto & entry : ftype_name_table) {
        if (strcmp(name, entry.name) == 0) {
            return entry.ftype;
        }
    }
    return not_found;
 }
 // Test-local reverse lookup: find the table name registered for `ftype`.
 // Returns the name string of the first row whose ftype equals the argument,
 // or nullptr when no row matches.
 static const char * llama_ftype_to_name(llama_ftype ftype) {
    const ftype_name_entry * const table_end =
        ftype_name_table + sizeof(ftype_name_table) / sizeof(ftype_name_table[0]);

    for (const ftype_name_entry * row = ftype_name_table; row != table_end; ++row) {
        if (row->ftype != ftype) {
            continue;  // not this row, keep scanning
        }
        return row->name;
    }
    return nullptr;
 }
 // ---------------------------------------------------------------------------
 // Mock tensor construction - may be better to extract this in the future
 // ---------------------------------------------------------------------------