[Feature] Tracing: Fine-Grained Tracing for Request Latency Part1 (#5458)

This commit is contained in:
xiaolei373
2025-12-16 16:36:09 +08:00
committed by GitHub
parent c9b47f90ce
commit a30b4da260
29 changed files with 5464 additions and 475 deletions

View File

@@ -34,6 +34,7 @@ import numpy as np
import paddle
from tqdm import tqdm
import fastdeploy.metrics.trace as tracing
from fastdeploy.engine.args_utils import EngineArgs
from fastdeploy.engine.common_engine import EngineService
from fastdeploy.engine.expert_service import start_data_parallel_service
@@ -97,6 +98,8 @@ class LLMEngine:
main_process_metrics.set_cache_config_info(obj=self.cfg.cache_config)
tracing.trace_set_thread_info("engine")
def start(self, api_server_pid=None):
"""
Initializes the engine and starts its sub-services.