We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 8b369df · commit de97cde · Copy full SHA for de97cde
vllm_ascend/ascend_forward_context.py
@@ -103,7 +103,7 @@ def set_ascend_forward_context(
103
max_tokens_across_dp / tp_world_size) * world_size
104
105
if fused_moe_state == FusedMoEState.MC2_PREFILL:
106
- chunk_size = envs.VLLM_ASCEND_FUSED_MOE_MC2_CHUNK_SIZE
+ chunk_size = envs_ascend.VLLM_ASCEND_FUSED_MOE_MC2_CHUNK_SIZE
107
forward_context.max_num_chunks = math.ceil(
108
math.ceil(max_tokens_across_dp / tp_world_size) /
109
chunk_size)
0 commit comments