Skip to content

Commit 3a63a12

Browse files
Charles Zhao authored and copybara-github committed
Allow prefill only run by allowing max_prompt_size == seq_len
PiperOrigin-RevId: 827415258
1 parent ab87807 commit 3a63a12

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

gemma/gemma.cc

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -511,7 +511,7 @@ static void GenerateT(const ModelConfig& config,
511511
// We use a single divisor, so all sequence lengths must be the same.
512512
HWY_ASSERT(qbatch.KV(qi).SeqLen() == seq_len);
513513
}
514-
if (max_prompt_size >= seq_len) {
514+
if (max_prompt_size > seq_len) {
515515
HWY_ABORT("max_prompt_size = %zu, increase --seq_len to at least that.",
516516
max_prompt_size);
517517
}

0 commit comments

Comments
 (0)