【Sync】Release/2.0.1 (#2745)

* Add RL Qwen model support

* fix

* fix
This commit is contained in:
gaoziyuan
2025-07-08 14:38:18 +08:00
committed by GitHub
parent ea787d8f62
commit 6851489425
13 changed files with 438 additions and 171 deletions

View File

@@ -293,7 +293,7 @@ class ColumnParallelLinear(LinearBase):
)
if self.nranks > 0:
# col parallel
- _set_var_distributed(self.linear_weight, split_axis=-1)
+ _set_var_distributed(self.linear_weight, split_axis=1)
self.linear_bias = None
if self.with_bias:
@@ -304,7 +304,7 @@ class ColumnParallelLinear(LinearBase):
)
if self.nranks > 0:
# col parallel
- _set_var_distributed(self.linear_bias, split_axis=-1)
+ _set_var_distributed(self.linear_bias, split_axis=1)
# smooth quant
self.linear_shift = None