[BugFix] fix RMSNorm rms_norm_esp (#2804)

This commit is contained in:
lizexu123
2025-07-10 20:39:02 +08:00
committed by GitHub
parent 823a47e64a
commit e681e1e719
7 changed files with 18 additions and 16 deletions

View File

@@ -79,12 +79,12 @@ class Qwen3Attention(nn.Layer):
self.q_norm = RMSNorm(fd_config=fd_config,
hidden_size=fd_config.model_config.head_dim,
eps=1e-6,
eps=fd_config.model_config.rms_norm_eps,
prefix=f"{prefix}.q_norm",
begin_norm_axis=2)
self.k_norm = RMSNorm(fd_config=fd_config,
hidden_size=fd_config.model_config.head_dim,
eps=1e-6,
eps=fd_config.model_config.rms_norm_eps,
prefix=f"{prefix}.k_norm",
begin_norm_axis=2)
@@ -184,7 +184,7 @@ class Qwen3Model(nn.Layer):
self.norm = RMSNorm(
fd_config,
hidden_size=fd_config.model_config.hidden_size,
eps=1e-6,
eps=fd_config.model_config.rms_norm_eps,
prefix=f"{fd_config.model_config.prefix_name}.norm",
)