diff --git a/vllm/model_executor/models/dbrx.py b/vllm/model_executor/models/dbrx.py index 4fbf0c3270fab..a2ce325fd7999 100644 --- a/vllm/model_executor/models/dbrx.py +++ b/vllm/model_executor/models/dbrx.py @@ -392,7 +392,7 @@ def sample( def load_weights(self, weights: Iterable[Tuple[str, torch.Tensor]]): expert_params_mapping = [( - "w13_weight" if weight_name in ["w1", "v1"] else "w2_weight", + "w13_" if weight_name in ["w1", "v1"] else "w2_", f"mlp.{weight_name}.", ) for weight_name in ["w1", "v1", "w2"]] params_dict = dict(self.named_parameters(remove_duplicate=False))