Skip to content

Commit a41e15e

Browse files
authored
fix for default quant (#3640)
1 parent 2748102 commit a41e15e

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

lmdeploy/pytorch/nn/moe.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -485,7 +485,7 @@ def weight_loader_with_quant(self, param: torch.nn.Parameter, loaded_weight: tor
485 485       self.weight._base_weight_loader(self.weight, quanted_weight, expert_id, shard_id)
486 486       self.weight_scale_inv.weight_loader(self.weight_scale_inv, scaling, expert_id, shard_id)
487 487   else:
488     -     return self.weight_loader(param, loaded_weight, expert_id, shard_id)
    488 +     return self.weight._base_weight_loader(param, loaded_weight, expert_id, shard_id)
489 489
490 490
491 491   class FusedMoEBlockedF8(nn.Module):

0 commit comments

Comments
 (0)