Correct SWA layer indexing: it is supposed to be 0, 3, 6, ... instead of 1, 4, 7, ...
This commit is contained in:
parent
46f21826b3
commit
33eed315a3
|
|
@@ -7987,7 +7987,7 @@ struct llm_build_modern_bert : public llm_graph_context {
|
||||||
ggml_tensor * Kcur = nullptr;
|
ggml_tensor * Kcur = nullptr;
|
||||||
ggml_tensor * Vcur = nullptr;
|
ggml_tensor * Vcur = nullptr;
|
||||||
|
|
||||||
const float rope_theta = (il+1) % 3 == 0 ? rope_theta_global : rope_theta_local;
|
const float rope_theta = il % 3 == 0 ? rope_theta_global : rope_theta_local;
|
||||||
|
|
||||||
|
|
||||||
// attention layer norm
|
// attention layer norm
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue