Correct SWA layer indexing: the layers that use rope_theta_global are supposed to be 0, 3, 6, ... (il % 3 == 0) instead of 2, 5, 8, ... ((il+1) % 3 == 0)

This commit is contained in:
ryan-mangeno 2025-10-01 14:19:44 -04:00
parent 46f21826b3
commit 33eed315a3
1 changed file with 1 addition and 1 deletion

View File

@@ -7987,7 +7987,7 @@ struct llm_build_modern_bert : public llm_graph_context {
ggml_tensor * Kcur = nullptr;
ggml_tensor * Vcur = nullptr;
const float rope_theta = (il+1) % 3 == 0 ? rope_theta_global : rope_theta_local;
const float rope_theta = il % 3 == 0 ? rope_theta_global : rope_theta_local;
// attention layer norm