[Feature] support rl_tp_degree (#3934)

* [Feature] support rl_tp_degree
* add rl_tp_degree in lmhead
* add rl_tp_degree in bias
* fix split_axis=0 in bias
* fix split_axis in weight
* fix bias rl_tp_degree
* fix bias rl_tp_degree
* change attr to dict

---------

Co-authored-by: Jiang-Jia-Jun <163579578+Jiang-Jia-Jun@users.noreply.github.com>
2025-10-05 16:48:03 +08:00 · 2025-09-08 16:20:32 +08:00
parent fa2369271d
commit d40a1046de
3 changed files with 31 additions and 1 deletions
--- a/fastdeploy/model_executor/layers/lm_head.py
+++ b/fastdeploy/model_executor/layers/lm_head.py
@@ -94,6 +94,12 @@ class ParallelLMHead(nn.Layer):
                        "model_format": self.fd_config.model_config.model_format,
                    },
                )
+                if self.bias_key is not None:
+                    set_weight_attrs(
+                        self.linear.bias,
+                        {"rl_need_attr": {"rl_tp_degree": fd_config.parallel_config.tensor_parallel_size}},
+                    )
+
                if self.nranks > 1:
                    set_weight_attrs(self.linear.weight, {"output_dim": True})
            else:
@@ -116,6 +122,9 @@ class ParallelLMHead(nn.Layer):

                if self.nranks > 1:
                    set_weight_attrs(self.linear.weight, {"output_dim": False})
+        set_weight_attrs(
+            self.linear.weight, {"rl_need_attr": {"rl_tp_degree": fd_config.parallel_config.tensor_parallel_size}}
+        )

    def load_state_dict(self, state_dict: Dict[str, paddle.Tensor | np.ndarray]):
        """