diff --git a/fastdeploy/worker/vl_gpu_model_runner.py b/fastdeploy/worker/vl_gpu_model_runner.py index 82af454b5..778ca8424 100644 --- a/fastdeploy/worker/vl_gpu_model_runner.py +++ b/fastdeploy/worker/vl_gpu_model_runner.py @@ -235,8 +235,6 @@ class GPUVLModelRunner(VLModelRunnerBase): fd_config.model_config.think_end_id = tokenizer.get_vocab()[""] fd_config.model_config.max_text_id = fd_config.model_config.im_patch_id fd_config.model_config.sequence_parallel = False - # TODO(YuanRisheng) The moe_k in develop is fixed to 8, need to be changed according to json config - fd_config.model_config.moe_k = 8 self.fd_config = fd_config self.model_cfg = self.fd_config.model_config self.image_preprocess = self._init_image_preprocess(