baidu
/

ERNIE-4.5-21B-A3B-PT

Text Generation

Model card | Files and versions

hlfby06 committed on Jul 18

Commit

25a6467

·

verified ·

1 Parent(s): da07396

fix model correction_bias

Files changed (1) hide show

modeling_ernie4_5_moe.py +8 -2

modeling_ernie4_5_moe.py CHANGED Viewed

@@ -483,8 +483,14 @@ class Ernie4_5_MoeMLP(nn.Module):
         S, H = x.shape
         E = gate_logits.shape[1]
         device = x.device
-        topk_prob, topk_idx = torch.topk(gate_logits, k, dim=-1)
-        combine_weights = topk_prob
         expert_id = topk_idx
         y = x.new_zeros((E, capacity, H))
         scatter_index = x.new_full((k, S), -1, dtype=torch.int32)

         S, H = x.shape
         E = gate_logits.shape[1]
         device = x.device
+        if self.use_correction_bias:
+            _, topk_idx = torch.topk(gate_logits + self.moe_statics.e_score_correction_bias, k, dim=-1)
+            topk_prob = torch.gather(gate_logits, dim=-1, index=topk_idx)
+        else:
+            topk_prob, topk_idx = torch.topk(gate_logits, k, dim=-1)
+        combine_weights = topk_prob
         expert_id = topk_idx
         y = x.new_zeros((E, capacity, H))
         scatter_index = x.new_full((k, S), -1, dtype=torch.int32)