mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 00:33:03 +08:00
add input_processor plugin (#3657)
* add input_processor plugin * update * update * update * update * update * update * update * update * update * update * update
This commit is contained in:
@@ -721,7 +721,8 @@ class RowParallelLinear(LinearBase):
|
||||
add_bias=add_bias,
|
||||
skip_quant=skip_quant,
|
||||
)
|
||||
|
||||
if add_bias:
|
||||
assert with_bias, "with_bias must be True when add_bias is True."
|
||||
assert self.quant_method is not None
|
||||
self.quant_method.create_weights(
|
||||
self,
|
||||
@@ -753,7 +754,8 @@ class RowParallelLinear(LinearBase):
|
||||
|
||||
if self.reduce_results and self.nranks > 1:
|
||||
tensor_model_parallel_all_reduce(out, self.tp_group)
|
||||
|
||||
if not self.fd_config.quant_config and self.add_bias:
|
||||
out = paddle.add(out, self.bias)
|
||||
return out
|
||||
|
||||
|
||||
|
Reference in New Issue
Block a user