mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 16:48:03 +08:00
This reverts commit d1d063e4af
.
This commit is contained in:
@@ -60,7 +60,6 @@ from fastdeploy.utils import (
|
||||
StatefulSemaphore,
|
||||
api_server_logger,
|
||||
console_logger,
|
||||
is_package_installed,
|
||||
is_port_available,
|
||||
retrive_model_from_server,
|
||||
)
|
||||
@@ -68,7 +67,7 @@ from fastdeploy.utils import (
|
||||
parser = FlexibleArgumentParser()
|
||||
parser.add_argument("--port", default=8000, type=int, help="port to the http server")
|
||||
parser.add_argument("--host", default="0.0.0.0", type=str, help="host to the http server")
|
||||
parser.add_argument("--workers", default=None, type=int, help="number of workers")
|
||||
parser.add_argument("--workers", default=1, type=int, help="number of workers")
|
||||
parser.add_argument("--metrics-port", default=8001, type=int, help="port for metrics server")
|
||||
parser.add_argument("--controller-port", default=-1, type=int, help="port for controller server")
|
||||
parser.add_argument(
|
||||
@@ -83,16 +82,6 @@ parser.add_argument(
|
||||
)
|
||||
parser = EngineArgs.add_cli_args(parser)
|
||||
args = parser.parse_args()
|
||||
|
||||
|
||||
if args.workers is None:
|
||||
# In GPU, the workers of uvicorn will be set according to the parameter `max-num-seqs`
|
||||
if is_package_installed("paddlepaddle-gpu"):
|
||||
args.workers = max(min(int(args.max_num_seqs // 32), 8), 1)
|
||||
else:
|
||||
args.workers = 1
|
||||
console_logger.info(f"Number of api-server workers: {args.workers}.")
|
||||
|
||||
args.model = retrive_model_from_server(args.model, args.revision)
|
||||
chat_template = load_chat_template(args.chat_template, args.model)
|
||||
if args.tool_parser_plugin:
|
||||
|
Reference in New Issue
Block a user