mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 08:37:06 +08:00
Add ci case for min token and max token (#3229)
Co-authored-by: xujing43 <xujing43@baidu.com>
This commit is contained in:
36
test/ce/server/test_params_boundary.py
Normal file
36
test/ce/server/test_params_boundary.py
Normal file
@@ -0,0 +1,36 @@
|
||||
#!/bin/env python3
|
||||
# -*- coding: utf-8 -*-
|
||||
# @author xujing43
|
||||
# encoding=utf-8 vi:ts=4:sw=4:expandtab:ft=python
|
||||
|
||||
"""
|
||||
Boundary value checking for API parameters
|
||||
"""
|
||||
|
||||
import json
|
||||
|
||||
from core import (
|
||||
TEMPLATE,
|
||||
URL,
|
||||
build_request_payload,
|
||||
send_request,
|
||||
)
|
||||
|
||||
def test_max_min_1_token():
    """Verify a request pinned to exactly one token yields exactly one token.

    Sends a non-streaming chat request with ``max_tokens`` and
    ``metadata.min_tokens`` both set to 1, then checks three things in order:

    1. ``"error"`` is not found in the response's ``object`` field
       (presumably a string such as the response type -- confirm against
       the server's schema).
    2. ``usage.completion_tokens`` equals 1.
    3. The first choice's ``finish_reason`` equals ``"length"``.
    """
    # Overrides applied on top of TEMPLATE; the prompt asks
    # "What is the capital of Africa?".
    overrides = dict(
        stream=False,
        messages=[dict(role="user", content="非洲的首都是?")],
        max_tokens=1,
        metadata=dict(min_tokens=1),
    )
    request_body = build_request_payload(TEMPLATE, overrides)
    http_reply = send_request(URL, request_body)
    reply = http_reply.json()

    # The error check comes first so a failed request is reported before any
    # other field is read.
    object_field = reply["object"]
    assert "error" not in object_field, f"响应中包含错误信息: {object_field}"

    usage = reply["usage"]
    generated = usage["completion_tokens"]
    assert generated == 1, f"实际生成的token数为: {generated}, 应该为1"

    first_choice = reply["choices"][0]
    stop_cause = first_choice["finish_reason"]
    # On failure the whole response is reported, not just the finish_reason.
    assert stop_cause == "length", f"内容不可能完整生成, 但实际finish_reason为: {reply}"
|
Reference in New Issue
Block a user