mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Feature] Guided Decoding add LLguidance backend (#5124)
* llguidance * add requirements_guided_decoding.txt and doc * fix test_guidance_*.py * fix test_guidance_*.py && mv * fix llguidance choice * test_guidance_* * rm lazy loader --------- Co-authored-by: YuBaoku <49938469+EmmonsCurse@users.noreply.github.com>
This commit is contained in:
@@ -294,7 +294,12 @@ class BackendBase:
|
||||
"""
|
||||
try:
|
||||
architectures = self.fd_config.model_config.architectures
|
||||
if not ErnieArchitectures.contains_ernie_arch(architectures):
|
||||
is_guidance_backend = (
|
||||
self.fd_config.structured_outputs_config is not None
|
||||
and self.fd_config.structured_outputs_config.guided_decoding_backend is not None
|
||||
and self.fd_config.structured_outputs_config.guided_decoding_backend == "guidance"
|
||||
)
|
||||
if not ErnieArchitectures.contains_ernie_arch(architectures) or is_guidance_backend:
|
||||
from transformers import AutoTokenizer, PreTrainedTokenizerFast
|
||||
|
||||
tokenizer = AutoTokenizer.from_pretrained(
|
||||
|
||||
Reference in New Issue
Block a user