Fix prefix-LM mode assertion

2024-09-25 22:22:28 +08:00 · 2024-09-25 22:22:28 +08:00 · d1010337c3
parent e70e686805
commit d1010337c3
1 changed files with 2 additions and 1 deletions
--- a/gemma/gemma-inl.h
+++ b/gemma/gemma-inl.h
@ -916,7 +916,8 @@ HWY_NOINLINE void Prefill(
    }
    // In prefix-LM mode, we need to look at all the tokens for the prefix in
    // one iteration through the layers, so we need a large enough batch size.
-    HWY_ASSERT(max_tbatch_size >= prefill_this_query);
+    HWY_ASSERT(prefix_end_this_query == 0 ||
+               max_tbatch_size >= prefill_this_query);

    // For each batch of tokens in the query:
    for (size_t tbatch_start = 0; tbatch_start < prefill_this_query;