This commit is contained in:
yangjianfengo1
2025-09-04 10:01:38 +08:00
committed by GitHub
parent 3790505319
commit c870be6d27

View File

@@ -359,7 +359,7 @@ class TestMobaAttention(unittest.TestCase):
model=model_path, model=model_path,
tensor_parallel_size=2, tensor_parallel_size=2,
max_model_len=131072, max_model_len=131072,
engine_worker_queue_port=8793, engine_worker_queue_port=int(os.getenv("FD_ENGINE_QUEUE_PORT")),
max_num_seqs=32, max_num_seqs=32,
quantization="wint4", quantization="wint4",
enable_chunked_prefill=True, enable_chunked_prefill=True,