@@ -10,7 +10,7 @@ jobs:
strategy:
matrix:
python-version: [ 3.7, 3.8, 3.9 ]
- attempt: [ 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20 ]
+ attempt: [ 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30 ]
fail-fast: false
timeout-minutes: 10
steps:
@@ -36,9 +36,6 @@ def cleanup_children():
with suppress(psutil.NoSuchProcess):
child.terminate()
psutil.wait_procs(children, timeout=1)
- for child in children:
- with suppress(psutil.NoSuchProcess):
- child.kill()
# Broken code or killing of child processes may leave the MPFuture backend corrupted
MPFuture.reset_backend()
@@ -577,6 +574,7 @@ def test_training_averager(n_steps: int = 10, n_dims: int = 16):
if __name__ == '__main__':
with cleanup_children():
+ print(f"BEGAN test_key_manager()")
loop = asyncio.new_event_loop()
loop.run_until_complete(test_key_manager())
print(f"PASSED test_key_manager()")
@@ -584,20 +582,25 @@ if __name__ == '__main__':
for n_clients in [0, 1, 2]:
for n_aux in [0, 1, 2]:
+ print(f"BEGAN _test_allreduce_once({n_clients}, {n_aux})")
_test_allreduce_once(n_clients, n_aux)
print(f"PASSED _test_allreduce_once({n_clients}, {n_aux})")
for n_clients, n_aux in [(0, 4), (1, 3), (0, 3)]:
+ print(f"BEGAN _test_allreduce_weighted")
test_allreduce_weighted()
print(f"PASSED _test_allreduce_weighted")
+ print(f"BEGAN _test_allreduce_grid")
test_allreduce_grid()
print(f"PASSED _test_allreduce_grid")
+ print("BEGAN _test_allreduce_compression")
test_allreduce_compression()
print(f"PASSED _test_allreduce_compression")