mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 08:21:53 +08:00
[BugFix]fix v1 loader lm head fp32 (#5270)
This commit is contained in:
@@ -376,7 +376,9 @@ class Qwen2ForCausalLM(ModelForCasualLM):
|
||||
model_sublayer_name = re.sub(r"\.(weight)$", "", model_param_name)
|
||||
process_weights_after_loading_fn(model_sublayer_name, param)
|
||||
if self.tie_word_embeddings:
|
||||
self.lm_head.linear.weight.set_value(self.qwen2.embed_tokens.embeddings.weight.transpose([1, 0]))
|
||||
self.lm_head.linear.weight.set_value(
|
||||
self.qwen2.embed_tokens.embeddings.weight.transpose([1, 0]).astype(self.lm_head.linear.weight.dtype)
|
||||
)
|
||||
|
||||
@classmethod
|
||||
def name(self):
|
||||
|
||||
Reference in New Issue
Block a user