mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
feat: add support for API usage with multimodal models (#4548)
* feat: add support for API usage with multimodal models
* completion_tokens contains num_image_tokens
* remove test_request.py
* fix: paddle.device.is_compiled_with_cuda()
* fix test_unstream_without_logprobs
This commit is contained in:
@@ -66,6 +66,7 @@ class CompletionTokenUsageInfo(BaseModel):
|
||||
"""
|
||||
|
||||
reasoning_tokens: Optional[int] = None
|
||||
image_tokens: Optional[int] = None
|
||||
|
||||
|
||||
class PromptTokenUsageInfo(BaseModel):
|
||||
@@ -74,6 +75,8 @@ class PromptTokenUsageInfo(BaseModel):
|
||||
"""
|
||||
|
||||
cached_tokens: Optional[int] = None
|
||||
image_tokens: Optional[int] = None
|
||||
video_tokens: Optional[int] = None
|
||||
|
||||
|
||||
class UsageInfo(BaseModel):
|
||||
|
||||
Reference in New Issue
Block a user