mirror of https://github.com/google/gemma.cpp.git
Allow prefill-only runs by allowing max_prompt_size == seq_len
PiperOrigin-RevId: 827415258
This commit is contained in:
parent
ab87807a4c
commit
3a63a12624
|
|
@ -511,7 +511,7 @@ static void GenerateT(const ModelConfig& config,
|
|||
// We use a single divisor, so all sequence lengths must be the same.
|
||||
HWY_ASSERT(qbatch.KV(qi).SeqLen() == seq_len);
|
||||
}
|
||||
if (max_prompt_size >= seq_len) {
|
||||
if (max_prompt_size > seq_len) {
|
||||
HWY_ABORT("max_prompt_size = %zu, increase --seq_len to at least that.",
|
||||
max_prompt_size);
|
||||
}
|
||||
|
|
|
|||
Loading…
Reference in New Issue