Fix noaux_router balance loss bug: normalize the router weights used for the balance loss

HIT-cwh · CyCle1024 · commit f9bd261d95b2 · 2025-11-06T19:41:13.000+08:00
diff --git a/xtuner/v1/module/router/noaux_router.py b/xtuner/v1/module/router/noaux_router.py
@@ -111,6 +111,10 @@ def forward(self, logits) -> RouterResults:
         _, topk_idx = torch.topk(scores_for_choice, k=self.top_k, dim=-1)
         topk_weight = scores.gather(1, topk_idx)
 
+        # The returned `router_weights` is used only for computing the balance loss,
+        # so it should be normalized (each row divided by its sum over the last dim).
+        scores_for_choice = scores_for_choice / torch.sum(scores_for_choice, dim=-1, keepdim=True)
+
         if self.top_k > 1 and self.norm_topk_prob:
             denominator = topk_weight.sum(dim=-1, keepdim=True) + 1e-20
             topk_weight = topk_weight / denominator
@@ -169,6 +173,10 @@ def forward(self, logits) -> RouterResults:
         topk_weight = scores_for_choice.gather(1, topk_idx)  # [seq, n_groups]
         scores_for_choice = scores_for_choice.view(seq, self.n_routed_experts)
 
+        # The returned `router_weights` is used only for computing the balance loss,
+        # so it should be normalized (each row divided by its sum over the last dim).
+        scores_for_choice = scores_for_choice / torch.sum(scores_for_choice, dim=-1, keepdim=True)
+
         if self.top_k > 1 and self.norm_topk_prob:
             denominator = topk_weight.sum(dim=-1, keepdim=True) + 1e-20
             topk_weight = topk_weight / denominator