mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Feature] Tracing: Fine-Grained Tracing for Request Latency Part1 (#5458)
This commit is contained in:
@@ -34,6 +34,7 @@ import numpy as np
|
||||
import paddle
|
||||
from tqdm import tqdm
|
||||
|
||||
import fastdeploy.metrics.trace as tracing
|
||||
from fastdeploy.engine.args_utils import EngineArgs
|
||||
from fastdeploy.engine.common_engine import EngineService
|
||||
from fastdeploy.engine.expert_service import start_data_parallel_service
|
||||
@@ -97,6 +98,8 @@ class LLMEngine:
|
||||
|
||||
main_process_metrics.set_cache_config_info(obj=self.cfg.cache_config)
|
||||
|
||||
tracing.trace_set_thread_info("engine")
|
||||
|
||||
def start(self, api_server_pid=None):
|
||||
"""
|
||||
Initializes the engine and starts its sub-services.
|
||||
|
||||
Reference in New Issue
Block a user