We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7136360, commit cbf0f7f (Copy full SHA for cbf0f7f)
vllm/v1/spec_decode/eagle.py
@@ -199,9 +199,9 @@ def propose(
199
# there's a multi-layer MTP module.
200
201
# Generate the remaining draft tokens.
202
- # [num_speculative_tokens, batch_size]
+ # Each tensor in the list has shape [batch_size].
203
draft_token_ids_list: list[torch.Tensor] = [draft_token_ids]
204
- # [num_speculative_tokens, batch_size, vocab_size]
+ # Each tensor in the list has shape [batch_size, vocab_size].
205
draft_probs_list: list[torch.Tensor] = [draft_probs]
206
207
positions = target_positions[last_token_indices]
0 commit comments