diff --git a/fastdeploy/entrypoints/openai/api_server.py b/fastdeploy/entrypoints/openai/api_server.py index f31cf32d4..db78ec6c2 100644 --- a/fastdeploy/entrypoints/openai/api_server.py +++ b/fastdeploy/entrypoints/openai/api_server.py @@ -60,7 +60,6 @@ from fastdeploy.utils import ( StatefulSemaphore, api_server_logger, console_logger, - is_package_installed, is_port_available, retrive_model_from_server, ) @@ -85,11 +84,8 @@ parser = EngineArgs.add_cli_args(parser) args = parser.parse_args() if args.workers is None: - # In GPU, the workers of uvicorn will be set according to the parameter `max-num-seqs` - if is_package_installed("paddlepaddle-gpu"): - args.workers = max(min(int(args.max_num_seqs // 32), 8), 1) - else: - args.workers = 1 + args.workers = max(min(int(args.max_num_seqs // 32), 8), 1) + console_logger.info(f"Number of api-server workers: {args.workers}.") args.model = retrive_model_from_server(args.model, args.revision)