Skip to content

Commit 8c167e1

Browse files
authored
[GCU] Update post_process (PaddlePaddle#3012)
1 parent 7634ffb commit 8c167e1

1 file changed

Lines changed: 4 additions & 0 deletions

File tree

fastdeploy/worker/gcu_model_runner.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -772,6 +772,8 @@ def _dummy_run(
772 772
post_process(
773 773
sampler_output=sampler_output,
774 774
model_output=model_output_data,
775 +
share_inputs=self.share_inputs,
776 +
block_size=self.parallel_config.block_size,
775 777
speculative_decoding=self.speculative_decoding,
776 778
skip_save_output=True,
777 779
)
@@ -989,6 +991,8 @@ class at the server level, which is too granular for ModelRunner.
989 991
post_process(
990 992
sampler_output=sampler_output,
991 993
model_output=model_output_data,
994 +
share_inputs=self.share_inputs,
995 +
block_size=self.parallel_config.block_size,
992 996
save_each_rank=self.parallel_config.use_ep,
993 997
speculative_decoding=self.speculative_decoding,
994 998
skip_save_output=skip_save_output,

0 commit comments

Comments (0)