mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 08:37:06 +08:00
[GCU] Update post_process (#3012)
This commit is contained in:
@@ -772,6 +772,8 @@ class GCUModelRunner(ModelRunnerBase):
|
||||
post_process(
|
||||
sampler_output=sampler_output,
|
||||
model_output=model_output_data,
|
||||
share_inputs=self.share_inputs,
|
||||
block_size=self.parallel_config.block_size,
|
||||
speculative_decoding=self.speculative_decoding,
|
||||
skip_save_output=True,
|
||||
)
|
||||
@@ -989,6 +991,8 @@ class GCUModelRunner(ModelRunnerBase):
|
||||
post_process(
|
||||
sampler_output=sampler_output,
|
||||
model_output=model_output_data,
|
||||
share_inputs=self.share_inputs,
|
||||
block_size=self.parallel_config.block_size,
|
||||
save_each_rank=self.parallel_config.use_ep,
|
||||
speculative_decoding=self.speculative_decoding,
|
||||
skip_save_output=skip_save_output,
|
||||
|
Reference in New Issue
Block a user