mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-11 07:44:35 +00:00
Update modeling_deepseek_v3.py
This commit is contained in:
parent
016d11e6d4
commit
e36ddc36a8
1 changed file with 1 addition and 1 deletion
|
@@ -436,7 +436,7 @@ class MoEGate(nn.Module):
|
|||
|
||||
### select top-k experts
|
||||
if self.topk_method == "noaux_tc":
|
||||
assert not self.training
|
||||
#assert not self.training
|
||||
scores_for_choice = scores.view(bsz * seq_len, -1) + self.e_score_correction_bias.unsqueeze(0)
|
||||
group_scores = (
|
||||
scores_for_choice.view(bsz * seq_len, self.n_group, -1).topk(2, dim=-1)[0].sum(dim = -1)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue