Commit d86e3f0

lint
Signed-off-by: Bill Nell <bnell@redhat.com>
1 parent 3ca8322 commit d86e3f0

File tree

1 file changed: +4 -7 lines changed

vllm/model_executor/layers/fused_moe/fused_batched_moe.py

Lines changed: 4 additions & 7 deletions
@@ -614,13 +614,10 @@ def apply(
             else:
                 num = int(expert_num_tokens[expert].item())
                 tmp = _resize_cache(workspace2, (num, N))
-                if self.use_fp8_w8a8:
-                    assert False  # TBD
-                else:
-                    input = hidden_states[expert, :num, :] @ w1[expert].transpose(
-                        0, 1)
-                    self.activation(activation, tmp, input)
-                    out[expert, :num, :] = tmp @ w2[expert].transpose(0, 1)
+                assert not self.use_fp8_w8a8
+                input = hidden_states[expert, :num, :] @ w1[expert].transpose(0, 1)
+                self.activation(activation, tmp, input)
+                out[expert, :num, :] = tmp @ w2[expert].transpose(0, 1)
 
         return out
 
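
For reference, the simplified branch performs three steps per expert: project the expert's valid tokens with w1, apply the activation into the workspace2 scratch buffer, and project back down with w2. Below is a minimal, self-contained sketch of that per-expert loop; the silu_and_mul activation, the weight shapes (w1: [E, 2N, K], w2: [E, K, N]), and the function names are assumptions for illustration only, not vLLM's actual API.

import torch


def silu_and_mul(x: torch.Tensor) -> torch.Tensor:
    # Split the 2N-wide gate/up projection and combine the halves (SwiGLU-style).
    gate, up = x.chunk(2, dim=-1)
    return torch.nn.functional.silu(gate) * up


def naive_batched_experts(
    hidden_states: torch.Tensor,      # [E, max_tokens, K]
    w1: torch.Tensor,                 # [E, 2N, K] gate/up projection per expert
    w2: torch.Tensor,                 # [E, K, N]  down projection per expert
    expert_num_tokens: torch.Tensor,  # [E] number of valid tokens per expert
) -> torch.Tensor:
    E = hidden_states.shape[0]
    out = torch.zeros_like(hidden_states)
    for expert in range(E):
        num = int(expert_num_tokens[expert].item())
        if num == 0:
            continue
        # Up/gate projection for this expert's valid tokens: [num, K] @ [K, 2N].
        inp = hidden_states[expert, :num, :] @ w1[expert].transpose(0, 1)
        tmp = silu_and_mul(inp)  # [num, N]
        # Down projection back to the model dimension: [num, N] @ [N, K].
        out[expert, :num, :] = tmp @ w2[expert].transpose(0, 1)
    return out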

0 commit comments
