We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 466166d · commit b2f069e — Copy full SHA for b2f069e
vllm/model_executor/layers/sampler.py
@@ -1197,7 +1197,7 @@ def _get_next_prompt_tokens(
1197
prompt_tokens = seq_data.prompt_token_ids
1198
# +1 because we are looking for a next prompt token.
1199
next_token_index_start = computed_len + 1
1200
- next_token_index_end = min(computed_len + query_len + 1,
+ next_token_index_end = min(computed_len + query_len,
1201
len(prompt_tokens))
1202
next_prompt_tokens = prompt_tokens[
1203
next_token_index_start:next_token_index_end]
0 commit comments