mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[XPU] support prefix cache (#4423)
Co-authored-by: ddchenhao66 <dhaochen163.com>
This commit is contained in:
@@ -410,7 +410,7 @@ class EngineArgs:
             self.enable_prefix_caching = False
         if self.speculative_config is not None:
             self.enable_prefix_caching = False
-        if not current_platform.is_cuda():
+        if not current_platform.is_cuda() and not current_platform.is_xpu():
             self.enable_prefix_caching = False
         # if self.dynamic_load_weight:
         # self.enable_prefix_caching = False
Reference in New Issue
Block a user