[RL] R3 Support RDMA Store (#5467)

* [RL] R3 support rdma store

* refine notes

* refine code

* disable prefix cache

* support preempted task and put cpu tensor
This commit is contained in:
RAM
2025-12-16 16:50:13 +08:00
committed by GitHub
parent a30b4da260
commit 6fc5eccf83
3 changed files with 69 additions and 4 deletions

View File

@@ -1498,14 +1498,17 @@ class RoutingReplayConfig:
"""Configuration for Routing Replay used in RL training"""
def __init__(self, args) -> None:
self.enable_routing_replay: bool = False
# Routing store type: local/rdma
self.routing_store_type: str = "local"
# Local routing store
self.local_store_dir: str = "./routing_replay_output"
# RDMA routing store
# TODO: Add RDMA routing store configuration attributes here when the feature is implemented.
self.rdma_store_server: str = ""
if args is not None:
for key, value in args.items():
@@ -1698,7 +1701,9 @@ class FDConfig:
self.cache_config.postprocess(self.scheduler_config.max_num_batched_tokens, self.scheduler_config.max_num_seqs)
if self.model_config is not None and self.model_config.enable_mm and not envs.ENABLE_V1_KVCACHE_SCHEDULER:
self.cache_config.enable_prefix_caching = False
if self.routing_replay_config is not None and self.routing_replay_config.enable_routing_replay:
# TODO(gongshaotian): R3 support prefix caching
self.cache_config.enable_prefix_caching = False
if (
self.structured_outputs_config is not None
and self.structured_outputs_config.guided_decoding_backend != "off"