[Feature] Optimize expert parallelism (#3196)

* optimize

* Update expert_service.py

* Update worker_process.py

* optimize
This commit is contained in:
ltd0924
2025-08-05 17:34:24 +08:00
committed by GitHub
parent dcf9c2daff
commit b20ffe3697
7 changed files with 174 additions and 134 deletions

View File

@@ -177,6 +177,8 @@ class OpenAIServingChat:
for res in response:
if res.get("error_code", 200) != 200:
raise ValueError("{}".format(res["error_msg"]))
if res["finished"]:
api_server_logger.info(f"chat completion finished: {request_id}")
self.engine_client.data_processor.process_response_dict(
res,