From 433f3d81d931bf3fb1fc5be8678e15b3a8b12fb7 Mon Sep 17 00:00:00 2001 From: Xu Song Date: Thu, 19 Jun 2025 16:13:32 +0800 Subject: [PATCH] sampler: drop extra +1 from next_token_index_end in _get_next_prompt_tokens Signed-off-by: Xu Song --- vllm/model_executor/layers/sampler.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/vllm/model_executor/layers/sampler.py b/vllm/model_executor/layers/sampler.py index 08840fc40cf6..013659778bd0 100644 --- a/vllm/model_executor/layers/sampler.py +++ b/vllm/model_executor/layers/sampler.py @@ -1197,8 +1197,7 @@ def _get_next_prompt_tokens( prompt_tokens = seq_data.prompt_token_ids # +1 because we are looking for a next prompt token. next_token_index_start = computed_len + 1 - next_token_index_end = min(computed_len + query_len + 1, - len(prompt_tokens)) + next_token_index_end = min(computed_len + query_len, len(prompt_tokens)) next_prompt_tokens = prompt_tokens[ next_token_index_start:next_token_index_end] return next_prompt_tokens