Forráskód Böngészése

undo harmful change

justheuristic 3 éve
szülő
commit
4bdccf8599
1 módosított fájl, 3 hozzáadás és 3 törlés
  1. +3 -3
      hivemind/optim/experimental/state_averager.py

+ 3 - 3
hivemind/optim/experimental/state_averager.py

@@ -541,9 +541,9 @@ class TrainingStateAverager(DecentralizedAverager):
             if not began_running:
                 logger.error(f"Aborted {self.__class__.__name__}.step because wait_for_trigger raised exception")
             logger.exception(e)
-            if averaging_control is not None and not averaging_control.triggered:
-                averaging_control.weight = 0.0
-                averaging_control.allow_allreduce()
+            if averaging_control is not None and not averaging_control.done():
+                logger.error(f"Cancelled scheduled state averaging round")
+                averaging_control.cancel()
             self.finished_optimizer_step.set()
             self.finished_averaging_round.set()