Manually set proper ordering of tensors, mostly applies to gemma

2026-03-26 21:35:13 -04:00 · 2026-03-26 21:35:13 -04:00 · 04c829966e
parent 9c00aab225
commit 04c829966e
5 changed files with 3493 additions and 3481 deletions
--- a/tests/snapshots/gemma-3-4b-it.schema
+++ b/tests/snapshots/gemma-3-4b-it.schema
--- a/tests/snapshots/glm-4.6v.schema
+++ b/tests/snapshots/glm-4.6v.schema
--- a/tests/snapshots/meta-llama-3.1-70b-instruct.schema
+++ b/tests/snapshots/meta-llama-3.1-70b-instruct.schema
--- a/tests/snapshots/qwen3-coder-next.schema
+++ b/tests/snapshots/qwen3-coder-next.schema
--- a/tests/test-quant-type-selection.cpp
+++ b/tests/test-quant-type-selection.cpp
@ -5,6 +5,7 @@
 #include "ggml-cpp.h"
 #include "gguf-model-data.h"

+#include <algorithm>
 #include <cstdio>
 #include <cstring>
 #include <fstream>
@ -269,6 +270,17 @@ static mock_tensors build_mock_tensors(const quantize_state_impl * qs,
        }
    }

+    // sort by layer index then name, matching llama_model_loader::weight_name_comparer
+    std::sort(result.begin(), result.end(), [](const ggml_tensor * a, const ggml_tensor * b) {
+        int a_layer = -1, b_layer = -1;
+        sscanf(a->name, "blk.%d.", &a_layer);
+        sscanf(b->name, "blk.%d.", &b_layer);
+        if (a_layer != b_layer) {
+            return a_layer < b_layer;
+        }
+        return strcmp(a->name, b->name) < 0;
+    });
+
    return { std::move(ctx), std::move(result) };
 }