Skip to content

Commit 7028370

Browse files
cleanup
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
1 parent 557ee9e commit 7028370

File tree

1 file changed

+0
-27
lines changed

1 file changed

+0
-27
lines changed

vllm/v1/spec_decode/utils.py

Lines changed: 0 additions & 27 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,6 @@
11
# SPDX-License-Identifier: Apache-2.0
22
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
33
from vllm.sampling_params import SamplingParams
4-
from vllm.triton_utils import tl, triton
54

65
_SAMPLING_EPS = 1e-5
76

@@ -13,29 +12,3 @@ def is_spec_decode_unsupported(sampling_params: SamplingParams) -> bool:
1312
or sampling_params.repetition_penalty != 1.0
1413
or sampling_params.min_p > _SAMPLING_EPS
1514
or sampling_params.logprobs is not None)
16-
17-
18-
@triton.jit
def prepare_eagle_input_kernel(
    out_ptr,
    cu_query_lens_ptr,
    cu_num_tokens_ptr,
    BLOCK_SIZE: tl.constexpr,
):
    """Fill one contiguous slice of ``out_ptr`` with consecutive indices.

    Each program along grid axis 0 handles one entry ``p``:

    * the destination slice is ``[cu_num_tokens_ptr[p],
      cu_num_tokens_ptr[p + 1])`` in ``out_ptr``;
    * the k-th element of that slice receives
      ``cu_query_lens_ptr[p] + k``.

    The slice is written in chunks of ``BLOCK_SIZE`` elements; the final
    chunk is masked so nothing past the end of the slice is stored.

    NOTE(review): the ``cu_`` prefix suggests both pointer arguments hold
    cumulative (prefix-sum) lengths, one entry per request plus a trailing
    total -- confirm against the caller.

    Args:
        out_ptr: Destination buffer for the generated indices.
        cu_query_lens_ptr: Per-program starting index value.
        cu_num_tokens_ptr: Per-program slice boundaries in ``out_ptr``;
            entries ``p`` and ``p + 1`` are read.
        BLOCK_SIZE: Compile-time number of elements written per iteration.
    """
    prog = tl.program_id(0)

    # Destination slice is the half-open range [slice_begin, slice_end).
    slice_begin = tl.load(cu_num_tokens_ptr + prog)
    slice_end = tl.load(cu_num_tokens_ptr + prog + 1)
    slice_len = slice_end - slice_begin

    # First index value written into this program's slice.
    first_index = tl.load(cu_query_lens_ptr + prog)

    # Loop-invariant pieces: lane offsets within a chunk and the slice base.
    lanes = tl.arange(0, BLOCK_SIZE)
    dst = out_ptr + slice_begin

    for chunk in tl.range(tl.cdiv(slice_len, BLOCK_SIZE)):
        rel = chunk * BLOCK_SIZE + lanes
        # Mask off lanes that fall beyond the end of the slice.
        tl.store(dst + rel, first_index + rel, mask=rel < slice_len)

0 commit comments

Comments
 (0)