mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
feat: add support for API usage with multimodal models (#4548)
* feat: add support for API usage with multimodal models
* completion_tokens contains num_image_tokens
* remove test_request.py
* fix: paddle.device.is_compiled_with_cuda()
* fix test_unstream_without_logprobs
This commit is contained in:
@@ -1068,6 +1068,7 @@ class EngineService:
|
||||
"""
|
||||
exit sub services
|
||||
"""
|
||||
llm_logger.info("Exit sub services.....")
|
||||
self.running = False
|
||||
if hasattr(self, "engine_worker_queue_server") and self.engine_worker_queue_server is not None:
|
||||
self.engine_worker_queue_server.cleanup()
|
||||
|
||||
Reference in New Issue
Block a user