File tree Expand file tree Collapse file tree 1 file changed +0
-27
lines changed Expand file tree Collapse file tree 1 file changed +0
-27
lines changed Original file line number Diff line number Diff line change 1
1
# SPDX-License-Identifier: Apache-2.0
2
2
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
3
3
from vllm .sampling_params import SamplingParams
4
- from vllm .triton_utils import tl , triton
5
4
6
5
_SAMPLING_EPS = 1e-5
7
6
@@ -13,29 +12,3 @@ def is_spec_decode_unsupported(sampling_params: SamplingParams) -> bool:
13
12
or sampling_params .repetition_penalty != 1.0
14
13
or sampling_params .min_p > _SAMPLING_EPS
15
14
or sampling_params .logprobs is not None )
16
-
17
-
18
@triton.jit
def prepare_eagle_input_kernel(
    out_ptr,
    cu_query_lens_ptr,
    cu_num_tokens_ptr,
    BLOCK_SIZE: tl.constexpr,
):
    """Fill one contiguous slice of ``out_ptr`` with consecutive indices.

    The program with id ``p`` on axis 0 reads ``cu_num_tokens_ptr[p]`` and
    ``cu_num_tokens_ptr[p + 1]`` as a half-open output range
    ``[begin, end)`` and ``cu_query_lens_ptr[p]`` as the first value to
    emit. It then writes ``out_ptr[begin + k] = first + k`` for every
    ``k`` in ``[0, end - begin)``.

    ``BLOCK_SIZE`` is the compile-time number of elements handled per loop
    iteration.
    """
    row = tl.program_id(0)

    # Value written at the first position of this program's output slice.
    first_index = tl.load(cu_query_lens_ptr + row)

    # Output slice handled by this program: [out_begin, out_end).
    out_begin = tl.load(cu_num_tokens_ptr + row)
    out_end = tl.load(cu_num_tokens_ptr + row + 1)
    span = out_end - out_begin

    block_count = tl.cdiv(span, BLOCK_SIZE)
    for blk in tl.range(block_count):
        lanes = blk * BLOCK_SIZE + tl.arange(0, BLOCK_SIZE)
        # The final block may extend past the slice; the mask drops the
        # lanes at or beyond ``span`` so nothing outside it is written.
        tl.store(
            out_ptr + out_begin + lanes,
            first_index + lanes,
            mask=lanes < span,
        )
You can’t perform that action at this time.
0 commit comments