diff --git a/python/sglang/srt/models/deepseek_v2.py b/python/sglang/srt/models/deepseek_v2.py index 6a960a37150..50ef16b88b9 100644 --- a/python/sglang/srt/models/deepseek_v2.py +++ b/python/sglang/srt/models/deepseek_v2.py @@ -1509,7 +1509,7 @@ def load_weights(self, weights: Iterable[Tuple[str, torch.Tensor]]): f"mlp.experts." f"{self.config.n_routed_experts + num_repeat}" f".{suffix}", - weights_dict[shared_expert_weight_name].clone(), + weights_dict[shared_expert_weight_name], ) ) names_to_remove += [shared_expert_weight_name]