qwen3 0.3B fix (#3255)
Some checks failed
Deploy GitHub Pages / deploy (push) Has been cancelled

This commit is contained in:
bukejiyu
2025-08-08 11:35:40 +08:00
committed by GitHub
parent fac2f64837
commit b76b17fc1b
2 changed files with 22 additions and 31 deletions

View File

@@ -286,6 +286,9 @@ class Qwen3ForCausalLM(ModelForCasualLM):
weight_loader = getattr(param, "weight_loader", default_weight_loader(self.fd_config))
weight_loader(param, loaded_weight)
if self.tie_word_embeddings:
self.lm_head.linear.weight.set_value(self.model.embed_tokens.embeddings.weight.transpose([1, 0]))
@paddle.no_grad()
def set_state_dict(self, state_dict):
"""