We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 466166d · commit 433f3d8 (Copy full SHA for 433f3d8)
vllm/model_executor/layers/sampler.py
@@ -1197,8 +1197,7 @@ def _get_next_prompt_tokens(
1197
prompt_tokens = seq_data.prompt_token_ids
1198
# +1 because we are looking for a next prompt token.
1199
next_token_index_start = computed_len + 1
1200
- next_token_index_end = min(computed_len + query_len + 1,
1201
- len(prompt_tokens))
+ next_token_index_end = min(computed_len + query_len, len(prompt_tokens))
1202
next_prompt_tokens = prompt_tokens[
1203
next_token_index_start:next_token_index_end]
1204
return next_prompt_tokens
0 commit comments