mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-16 21:51:31 +08:00
fix port (#3863)
This commit is contained in:
@@ -359,7 +359,7 @@ class TestMobaAttention(unittest.TestCase):
|
|||||||
model=model_path,
|
model=model_path,
|
||||||
tensor_parallel_size=2,
|
tensor_parallel_size=2,
|
||||||
max_model_len=131072,
|
max_model_len=131072,
|
||||||
engine_worker_queue_port=8793,
|
engine_worker_queue_port=int(os.getenv("FD_ENGINE_QUEUE_PORT")),
|
||||||
max_num_seqs=32,
|
max_num_seqs=32,
|
||||||
quantization="wint4",
|
quantization="wint4",
|
||||||
enable_chunked_prefill=True,
|
enable_chunked_prefill=True,
|
||||||
|
Reference in New Issue
Block a user