We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b3d76a5 commit 587ee3b — Copy full SHA for 587ee3b
vllm/model_executor/layers/quantization/fp8.py
@@ -1143,12 +1143,9 @@ def apply(
1143
x: torch.Tensor,
1144
router_logits: torch.Tensor,
1145
) -> torch.Tensor | tuple[torch.Tensor, torch.Tensor]:
1146
- if layer.enable_eplb:
1147
- assert layer.expert_load_view is not None
1148
- assert layer.logical_to_physical_map is not None
1149
- assert layer.logical_replica_count is not None
1150
-
1151
if self.flashinfer_moe_backend == FlashinferMoeBackend.TENSORRT_LLM:
+ if layer.enable_eplb:
+ raise NotImplementedError("EPLB not supported for `Fp8MoEMethod` yet.")
1152
assert layer.activation == "silu", (
1153
f"Expected 'silu' activation but got {layer.activation}"
1154
)
0 commit comments