【Sync】Release/2.0.1 (#2745)

* add rl qwen model support

* fix

* fix
This commit is contained in:
gaoziyuan
2025-07-08 14:38:18 +08:00
committed by GitHub
parent ea787d8f62
commit 6851489425
13 changed files with 438 additions and 171 deletions

View File

@@ -21,7 +21,11 @@ from dataclasses import dataclass, field
from typing import List, Optional
import paddle
from paddle.nn.functional.flash_attention import flash_attention_v3_varlen
# Optional import: if flash_attention_v3_varlen cannot be imported, bind the
# name to None so that importing this module still succeeds.
# NOTE(review): callers presumably check for None before use — confirm.
try:
    from paddle.nn.functional.flash_attention import flash_attention_v3_varlen
except ImportError:
    # Catch only import failures; a bare ``except:`` would also swallow
    # KeyboardInterrupt/SystemExit and mask unrelated errors.
    flash_attention_v3_varlen = None
from fastdeploy.config import FDConfig
from fastdeploy.model_executor.layers.attention.attention import Attention