justheuristic 4 年之前
父节点
当前提交
882cad67da
共有 1 个文件被更改,包括 0 次插入和 1 次删除
  1. 0 1
      hivemind/moe/client/balanced_expert.py

+ 0 - 1
hivemind/moe/client/balanced_expert.py

@@ -67,7 +67,6 @@ class BalancedRemoteExpert(nn.Module):
 
         # Note: we send DUMMY to prevent torch from excluding expert from backward if no other inputs require grad
         flat_outputs = _BalancedRemoteModuleCall.apply(DUMMY,
-                                                       self.uid,
                                                        self.expert_balancer,
                                                        self.info,
                                                        self.forward_timeout,