mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-06 00:57:33 +08:00
[FIX 2.0.2] Fix top_p and top_k default values (#2810)
* Fix top_p and top_k default values
* Update top_k
This commit is contained in:
@@ -82,7 +82,7 @@ class SamplingParams:
|
|||||||
frequency_penalty: float = None
|
frequency_penalty: float = None
|
||||||
repetition_penalty: float = None
|
repetition_penalty: float = None
|
||||||
temperature: float = None
|
temperature: float = None
|
||||||
top_p: float = 1.0
|
top_p: float = None
|
||||||
top_k: int = 0
|
top_k: int = 0
|
||||||
seed: Optional[int] = None
|
seed: Optional[int] = None
|
||||||
stop: Optional[Union[str, List[str]]] = None
|
stop: Optional[Union[str, List[str]]] = None
|
||||||
@@ -132,7 +132,7 @@ class SamplingParams:
|
|||||||
repetition_penalty=repetition_penalty
|
repetition_penalty=repetition_penalty
|
||||||
if repetition_penalty is not None else 1.0,
|
if repetition_penalty is not None else 1.0,
|
||||||
temperature=temperature if temperature is not None else 1.0,
|
temperature=temperature if temperature is not None else 1.0,
|
||||||
top_p=top_p if top_p is not None else 1.0,
|
top_p=top_p,
|
||||||
top_k=top_k if top_k is not None else 0,
|
top_k=top_k if top_k is not None else 0,
|
||||||
seed=seed,
|
seed=seed,
|
||||||
stop=stop,
|
stop=stop,
|
||||||
|
@@ -244,7 +244,7 @@ class GPUModelRunner(ModelRunnerBase):
|
|||||||
request.eos_token_ids.append(request.eos_token_ids[0])
|
request.eos_token_ids.append(request.eos_token_ids[0])
|
||||||
self.share_inputs["eos_token_id"][:] = np.array(
|
self.share_inputs["eos_token_id"][:] = np.array(
|
||||||
request.eos_token_ids, dtype="int64").reshape(-1, 1)
|
request.eos_token_ids, dtype="int64").reshape(-1, 1)
|
||||||
self.share_inputs["top_p"][idx:idx + 1] = request.get("top_p", 1.0)
|
self.share_inputs["top_p"][idx:idx + 1] = request.get("top_p", 0.7)
|
||||||
self.share_inputs["top_k"][idx:idx + 1] = request.get("top_k", 0)
|
self.share_inputs["top_k"][idx:idx + 1] = request.get("top_k", 0)
|
||||||
self.share_inputs["temperature"][idx:idx + 1] = request.get(
|
self.share_inputs["temperature"][idx:idx + 1] = request.get(
|
||||||
"temperature", 0.95)
|
"temperature", 0.95)
|
||||||
|
@@ -279,7 +279,7 @@ class XPUModelRunner(ModelRunnerBase):
|
|||||||
self.share_inputs["eos_token_id"][:] = np.array(
|
self.share_inputs["eos_token_id"][:] = np.array(
|
||||||
request.eos_token_ids, dtype="int64").reshape(-1, 1)
|
request.eos_token_ids, dtype="int64").reshape(-1, 1)
|
||||||
self.share_inputs["pre_ids"][idx:idx + 1] = -1
|
self.share_inputs["pre_ids"][idx:idx + 1] = -1
|
||||||
self.share_inputs["top_p"][idx:idx + 1] = request.get("top_p", 1.0)
|
self.share_inputs["top_p"][idx:idx + 1] = request.get("top_p", 0.7)
|
||||||
self.share_inputs["top_k"][idx:idx + 1] = request.get("top_k", 0)
|
self.share_inputs["top_k"][idx:idx + 1] = request.get("top_k", 0)
|
||||||
self.share_inputs["temperature"][idx:idx + 1] = request.get(
|
self.share_inputs["temperature"][idx:idx + 1] = request.get(
|
||||||
"temperature", 0.95)
|
"temperature", 0.95)
|
||||||
|
Reference in New Issue
Block a user