Commit 07d96ca

fix lint

Signed-off-by: Bill Nell <bnell@redhat.com>

1 parent ab6bb13

vllm/model_executor/layers/fused_moe/layer.py

Lines changed: 3 additions & 6 deletions
@@ -121,8 +121,6 @@ def init_prepare_finalize(self, moe: FusedMoEConfig,
 
             handle = all2all_manager.get_handle(all_to_all_args)
 
-            #assert moe.tp_size == all2all_manager.tp_group.world_size
-
             prepare_finalize = PplxPrepareAndFinalize(
                 handle,
                 max_num_tokens=moe.max_num_tokens,

@@ -160,10 +158,9 @@ def init_prepare_finalize(self, moe: FusedMoEConfig,
             # Note : We may want to use FP8 dispatch even otherwise just to
             # reduce datamovement
             assert moe.quant_config is not None
-            use_fp8_dispatch = (moe.quant_config.quant_dtype
-                                == current_platform.fp8_dtype()
-                                and moe.quant_config.block_shape[1]
-                                == DEEPEP_QUANT_BLOCK_SHAPE)
+            use_fp8_dispatch = (
+                moe.quant_config.quant_dtype == current_platform.fp8_dtype()
+                and moe.quant_config.block_shape == DEEPEP_QUANT_BLOCK_SHAPE)
 
             # Note (varun): Whether to use FP8 dispatch or not needs some
             # profiling. Turning it off for now.
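
For reference, a minimal, self-contained sketch of the reformatted FP8-dispatch check. The stub dataclass, the fp8_dtype() helper, and the [128, 128] block shape are assumptions standing in for vLLM's quant config, current_platform, and DEEPEP_QUANT_BLOCK_SHAPE; only the boolean condition itself mirrors the "+" lines of the diff.

# Minimal sketch, not vLLM's actual module layout: stand-ins for the names
# the diff relies on, to show how the reformatted condition evaluates.
from dataclasses import dataclass
from typing import Optional

import torch

# Assumed value; stands in for vLLM's DEEPEP_QUANT_BLOCK_SHAPE constant.
DEEPEP_QUANT_BLOCK_SHAPE = [128, 128]


@dataclass
class QuantConfigStub:
    # Assumed fields; the real quant config carries more state.
    quant_dtype: Optional[torch.dtype]
    block_shape: Optional[list]


def fp8_dtype() -> torch.dtype:
    # Stand-in for current_platform.fp8_dtype(); the real dtype is
    # platform-dependent.
    return torch.float8_e4m3fn


def should_use_fp8_dispatch(quant_config: QuantConfigStub) -> bool:
    # Same boolean as the diff's new lines: use FP8 dispatch only when the
    # quant dtype is the platform FP8 dtype and the full block shape matches
    # the DeepEP quant block shape (the old code compared block_shape[1]).
    return (quant_config.quant_dtype == fp8_dtype()
            and quant_config.block_shape == DEEPEP_QUANT_BLOCK_SHAPE)


# Example: FP8 dtype with matching block shape -> True; bfloat16 -> False.
print(should_use_fp8_dispatch(QuantConfigStub(torch.float8_e4m3fn, [128, 128])))
print(should_use_fp8_dispatch(QuantConfigStub(torch.bfloat16, [128, 128])))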
