mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[BugFix][Cherry-Pick] fix can not enter into cuda graph (#5423)
* fix bug * fix bug
This commit is contained in:
@@ -1578,7 +1578,7 @@ class FDConfig:
|
||||
self.graph_opt_config.init_with_cudagrpah_size(max_capture_size=max_capture_shape)
|
||||
|
||||
if self.parallel_config.use_ep:
|
||||
self.graph_opt_config.cudagraph_capture_sizes = [0] + self.graph_opt_config.cudagraph_capture_sizes
|
||||
self.graph_opt_config.cudagraph_capture_sizes += [0]
|
||||
|
||||
self.tokenizer = tokenizer
|
||||
self.ips = ips
|
||||
|
||||
Reference in New Issue
Block a user