mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-16 05:30:58 +08:00
fix port (#3863)
This commit is contained in:
@@ -359,7 +359,7 @@ class TestMobaAttention(unittest.TestCase):
|
||||
model=model_path,
|
||||
tensor_parallel_size=2,
|
||||
max_model_len=131072,
|
||||
-engine_worker_queue_port=8793,
|
||||
+engine_worker_queue_port=int(os.getenv("FD_ENGINE_QUEUE_PORT")),
|
||||
max_num_seqs=32,
|
||||
quantization="wint4",
|
||||
enable_chunked_prefill=True,
|
||||
|
Reference in New Issue
Block a user