1 parent 4863dff commit e850c8b
vllm/model_executor/layers/quantization/fp8.py
@@ -1171,12 +1171,9 @@ def apply(
         x: torch.Tensor,
         router_logits: torch.Tensor,
     ) -> torch.Tensor | tuple[torch.Tensor, torch.Tensor]:
-        if layer.enable_eplb:
-            assert layer.expert_load_view is not None
-            assert layer.logical_to_physical_map is not None
-            assert layer.logical_replica_count is not None
-
         if self.flashinfer_moe_backend == FlashinferMoeBackend.TENSORRT_LLM:
+            if layer.enable_eplb:
+                raise NotImplementedError("EPLB not supported for `Fp8MoEMethod` yet.")
             assert layer.activation == "silu", (
                 f"Expected 'silu' activation but got {layer.activation}"
             )
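For context, the net effect of the hunk above is that enabling EPLB on the FlashInfer TensorRT-LLM path now fails fast with NotImplementedError, instead of unconditionally asserting that the EPLB bookkeeping tensors (expert_load_view, logical_to_physical_map, logical_replica_count) are populated. Below is a minimal, self-contained sketch of that guard; the Layer dataclass and the FlashinferMoeBackend stand-in are hypothetical simplifications, not vLLM's actual classes.

# Sketch only: mirrors the guard added in the diff, with stand-in types.
from dataclasses import dataclass
from enum import Enum, auto


class FlashinferMoeBackend(Enum):  # stand-in for vLLM's backend enum
    TENSORRT_LLM = auto()
    OTHER = auto()


@dataclass
class Layer:  # hypothetical stand-in for the MoE layer object
    enable_eplb: bool = False
    activation: str = "silu"


def apply(layer: Layer, backend: FlashinferMoeBackend) -> None:
    # On the TRT-LLM backend, reject EPLB up front rather than asserting
    # that EPLB bookkeeping tensors are set.
    if backend is FlashinferMoeBackend.TENSORRT_LLM:
        if layer.enable_eplb:
            raise NotImplementedError("EPLB not supported for `Fp8MoEMethod` yet.")
        assert layer.activation == "silu", (
            f"Expected 'silu' activation but got {layer.activation}"
        )


apply(Layer(), FlashinferMoeBackend.TENSORRT_LLM)  # passes
try:
    apply(Layer(enable_eplb=True), FlashinferMoeBackend.TENSORRT_LLM)
except NotImplementedError as exc:
    print(exc)  # EPLB not supported for `Fp8MoEMethod` yet.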