update FAQ

This commit is contained in:
Azure 2025-02-12 08:50:58 +00:00
parent 0564ac8465
commit 3897f001f5
3 changed files with 55 additions and 7 deletions

View file

@@ -1699,7 +1699,7 @@ class DeepseekV3ForCausalLM(DeepseekV3PreTrainedModel):
)
hidden_states = outputs[0]
-logits = self.lm_head(hidden_states)
+logits = self.lm_head(hidden_states.to(self.lm_head.weight.device))
logits = logits.float()
loss = None