Modify DeepSeek load_weights() to align with main

sunnyqgg · sunnyqgg · commit 1898a10d9d23 · 2025-09-01T07:59:21.000Z
Signed-off-by: qgai <qgai@nvidia.com>
diff --git a/tensorrt_llm/_torch/models/modeling_deepseekv3.py b/tensorrt_llm/_torch/models/modeling_deepseekv3.py
@@ -153,8 +153,7 @@ def split(v, tp_size, idx, dim=0):
                 return v
             if len(v.shape) == 1:
                 return torch.chunk(v, tp_size)[idx].contiguous()
-            else:
-                return torch.chunk(v, tp_size, dim=dim)[idx].contiguous()
+            return torch.chunk(v, tp_size, dim=dim)[idx].contiguous()
 
         def split_matrix_tp(v, tensor_parallel, rank, dim):
             return split(v, tensor_parallel, rank, dim=dim)
@@ -269,7 +268,9 @@ def split_kv_b_proj(kv_b_proj: torch.Tensor,
 
         for name, module in tqdm(all_named_modules.items(),
                                  desc="Loading weights"):
-            if len(module._parameters) > 0:
+            if len(module._parameters) <= 0 or name.startswith("draft_model"):
+                continue
+            else:
                 names = name.split('.')
                 parent_module_name = '.'.join(names[:-1])
                 if "model.layers" in name and int(