mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Feature] Set v1 scheduler as default in develop (#3807)
* Set scheduler v1 as default
* Set scheduler v1 as default
* Set scheduler v1 as default
* Set scheduler v1 as default
* Set scheduler v1 as default
* close V1 in guided_decoding
* fix vl ci
* close V1 in guided_decoding
This commit is contained in:
@@ -1,5 +1,6 @@
|
||||
import unittest
|
||||
|
||||
from fastdeploy import envs
|
||||
from fastdeploy.config import (
|
||||
CacheConfig,
|
||||
FDConfig,
|
||||
@@ -48,7 +49,8 @@ class TestConfig(unittest.TestCase):
|
||||
ips="0.0.0.0",
|
||||
test_mode=True,
|
||||
)
|
||||
assert fd_config.max_num_batched_tokens == 2048
|
||||
if not envs.ENABLE_V1_KVCACHE_SCHEDULER:
|
||||
assert fd_config.max_num_batched_tokens == 2048
|
||||
|
||||
cache_config.enable_chunked_prefill = False
|
||||
fd_config = FDConfig(
|
||||
@@ -58,7 +60,8 @@ class TestConfig(unittest.TestCase):
|
||||
ips="0.0.0.0",
|
||||
test_mode=True,
|
||||
)
|
||||
assert fd_config.max_num_batched_tokens == 8192
|
||||
if not envs.ENABLE_V1_KVCACHE_SCHEDULER:
|
||||
assert fd_config.max_num_batched_tokens == 8192
|
||||
|
||||
def test_fdconfig_init_cache(self):
|
||||
parallel_config = ParallelConfig({})
|
||||
|
||||
Reference in New Issue
Block a user