Skip to content

Commit e7ad830

Browse files
committed
Optimize code format
Signed-off-by: skylee-01 <497627264@qq.com>
1 parent 26f2b7f commit e7ad830

File tree

1 file changed

+5
-6
lines changed

1 file changed

+5
-6
lines changed

vllm/v1/spec_decode/mlp_speculator.py

Lines changed: 5 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -28,11 +28,10 @@ def __init__(
2828
self.vllm_config = vllm_config
2929
self.device = device
3030
self.max_num_seqs = vllm_config.scheduler_config.max_num_seqs
31-
self.hidden_size = vllm_config.speculative_config.\
32-
draft_model_config.get_hidden_size(
33-
)
34-
self.num_speculative_tokens = vllm_config.speculative_config.\
35-
num_speculative_tokens
31+
self.hidden_size = (vllm_config.speculative_config.
32+
draft_model_config.get_hidden_size())
33+
self.num_speculative_tokens = (vllm_config.speculative_config.
34+
num_speculative_tokens)
3635
self.dtype = vllm_config.model_config.dtype
3736

3837
def propose(
@@ -41,7 +40,7 @@ def propose(
4140
previous_hidden_states: torch.Tensor,
4241
num_predict_tokens: int,
4342
sampling_metadata: SamplingMetadata,
44-
) -> torch.Tensor:
43+
) -> list[list[int]]:
4544
# Generate blocks and compute logits
4645
draft_tokens = self.model.generate_proposals(input_ids, previous_hidden_states, num_predict_tokens,sampling_metadata)
4746
return list(map(lambda x: x[0], zip(*[i.sampled_token_ids.tolist() for i in draft_tokens])))

0 commit comments

Comments
 (0)