Mirror of https://github.com/PaddlePaddle/FastDeploy.git (synced 2025-10-05 08:37:06 +08:00).
[Feature] support prompt repetition_penalty (#2806)
Some checks failed
Deploy GitHub Pages / deploy (push) Has been cancelled
Some checks failed
Deploy GitHub Pages / deploy (push) Has been cancelled
This commit is contained in:
@@ -57,6 +57,12 @@ def _create_default_sampling_metadata(
         top_p=paddle.full(shape=[batch_size, 1],
                           fill_value=0.7,
                           dtype="float32"),
+        prompt_ids=paddle.full(shape=[batch_size, max_seq_len],
+                               fill_value=0,
+                               dtype="int64"),
+        prompt_lens=paddle.full(shape=[batch_size, 1],
+                                fill_value=5,
+                                dtype="int64"),
         step_idx=paddle.full(shape=[batch_size, 1],
                              fill_value=0,
                              dtype="int64"),
Reference in New Issue
Block a user