mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 08:37:06 +08:00
[Feature] remove dependency on enable_mm and refine multimodal's code (#3014)
* remove dependency on enable_mm
* fix codestyle check error
* fix codestyle check error
* update docs
* resolve conflicts on model config
* fix unit test error
* fix code style check error

---------

Co-authored-by: shige <1021937542@qq.com>
Co-authored-by: Jiang-Jia-Jun <163579578+Jiang-Jia-Jun@users.noreply.github.com>
This commit is contained in:
@@ -28,9 +28,11 @@ from tqdm import tqdm
|
||||
from fastdeploy.engine.args_utils import EngineArgs
|
||||
from fastdeploy.engine.engine import LLMEngine
|
||||
from fastdeploy.engine.sampling_params import SamplingParams
|
||||
|
||||
# from fastdeploy.entrypoints.chat_utils import ChatCompletionMessageParam
|
||||
from fastdeploy.utils import llm_logger, retrive_model_from_server
|
||||
from fastdeploy.utils import (
|
||||
deprecated_kwargs_warning,
|
||||
llm_logger,
|
||||
retrive_model_from_server,
|
||||
)
|
||||
from fastdeploy.worker.output import Logprob, LogprobsLists
|
||||
|
||||
root_logger = logging.getLogger()
|
||||
@@ -72,6 +74,8 @@ class LLM:
|
||||
enable_logprob: Optional[bool] = False,
|
||||
**kwargs,
|
||||
):
|
||||
deprecated_kwargs_warning(**kwargs)
|
||||
|
||||
model = retrive_model_from_server(model, revision)
|
||||
engine_args = EngineArgs(
|
||||
model=model,
|
||||
|
Reference in New Issue
Block a user