Browse source

Fix a potential deadlock in enter_asynchronously with nested locks (#503)

This PR fixes a potential deadlock in hivemind.utils.enter_asynchronously.
The deadlock occurs when many coroutines enter nested locks concurrently and exhaust all workers in the shared ThreadPoolExecutor.
In this PR, we mitigate it by creating a dedicated executor for entering locks, with no limit on the number of workers.
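
For context, here is a minimal standalone sketch (illustrative, not part of this PR) of the failure mode: with a bounded executor, a coroutine that holds the outer lock needs a free worker to enter the inner lock, while every worker is already blocked acquiring the outer lock.

    import asyncio
    import threading
    from concurrent.futures import ThreadPoolExecutor

    lock1, lock2 = threading.Lock(), threading.Lock()
    bounded = ThreadPoolExecutor(max_workers=2)  # a small pool makes the hang easy to hit

    async def nested(loop):
        await loop.run_in_executor(bounded, lock1.acquire)  # ties up a worker until lock1 is free
        try:
            await asyncio.sleep(0.01)
            # by now both workers are blocked acquiring lock1, so this submission never runs
            await loop.run_in_executor(bounded, lock2.acquire)
            lock2.release()
        finally:
            lock1.release()

    async def main():
        loop = asyncio.get_running_loop()
        await asyncio.wait_for(asyncio.gather(*(nested(loop) for _ in range(8))), timeout=5)

    # asyncio.run(main())  # hangs, then raises TimeoutError after 5 seconds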

Co-authored-by: Aleksandr Borzunov <borzunov.alexander@gmail.com>
(cherry picked from commit b02bdadd0e25335048e1e3cca6fa572ca02f6faa)
justheuristic 3 years ago
commit
5aa4e3d85b
2 changed files with 42 additions and 1 deletion
  1. hivemind/utils/asyncio.py (+16 -1)
  2. tests/test_util_modules.py (+26 -0)

+ 16 - 1
hivemind/utils/asyncio.py

@@ -1,5 +1,7 @@
 import asyncio
 import concurrent.futures
+import multiprocessing as mp
+import os
 from concurrent.futures import ThreadPoolExecutor
 from contextlib import AbstractAsyncContextManager, AbstractContextManager, asynccontextmanager
 from typing import AsyncIterable, AsyncIterator, Awaitable, Callable, Iterable, Optional, Tuple, TypeVar, Union
@@ -167,12 +169,25 @@ async def attach_event_on_finished(iterable: AsyncIterable[T], event: asyncio.Ev
 class _AsyncContextWrapper(AbstractAsyncContextManager):
     """Wrapper for a non-async context manager that allows entering and exiting it in EventLoop-friendly manner"""

+    EXECUTOR_PID = None
+    CONTEXT_EXECUTOR = None
+    EXECUTOR_LOCK = mp.Lock()
+
     def __init__(self, context: AbstractContextManager):
         self._context = context

+    @classmethod
+    def get_process_wide_executor(cls):
+        if os.getpid() != cls.EXECUTOR_PID:
+            with cls.EXECUTOR_LOCK:
+                if os.getpid() != cls.EXECUTOR_PID:
+                    cls.CONTEXT_EXECUTOR = ThreadPoolExecutor(max_workers=float("inf"))
+                    cls.EXECUTOR_PID = os.getpid()
+        return cls.CONTEXT_EXECUTOR
+
     async def __aenter__(self):
         loop = asyncio.get_event_loop()
-        return await loop.run_in_executor(None, self._context.__enter__)
+        return await loop.run_in_executor(self.get_process_wide_executor(), self._context.__enter__)

     async def __aexit__(self, exc_type, exc_value, traceback):
         return self._context.__exit__(exc_type, exc_value, traceback)
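
Note how the fix works: __aenter__ now runs the blocking __enter__ in a dedicated, effectively unbounded executor, so a coroutine entering a nested lock can always get a worker; the PID check lazily recreates the executor after a fork, and the double-checked EXECUTOR_LOCK keeps two threads from racing to initialize it. A minimal usage sketch (illustrative; it assumes only the public enter_asynchronously helper from hivemind.utils.asyncio):

    import asyncio
    import multiprocessing as mp
    from hivemind.utils.asyncio import enter_asynchronously

    lock1, lock2 = mp.Lock(), mp.Lock()

    async def critical_section():
        # each blocking __enter__ runs in the unbounded process-wide executor,
        # so concurrent coroutines never starve each other of workers
        async with enter_asynchronously(lock1):
            async with enter_asynchronously(lock2):
                await asyncio.sleep(0.01)

    async def main():
        await asyncio.gather(*(critical_section() for _ in range(100)))

    # asyncio.run(main())  # completes without deadlocking after this change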

+ 26 - 0
tests/test_util_modules.py

@@ -507,6 +507,32 @@ async def test_async_context():
     # running this without enter_asynchronously would deadlock the event loop


+@pytest.mark.asyncio
+async def test_async_context_flooding():
+    """
+    test for a possible deadlock when many coroutines await the lock and overwhelm the underlying ThreadPoolExecutor
+
+    Here's how the test below works: suppose that the thread pool has at most N workers;
+    If at least N + 1 coroutines await lock1 concurrently, N of them occupy workers and the rest are awaiting workers;
+    When the first of N workers acquires lock1, it lets coroutine A inside lock1 and into await sleep(1e-2);
+    During that sleep, one of the worker-less coroutines will take up the worker freed by coroutine A.
+    Finally, coroutine A finishes sleeping and immediately gets stuck at lock2, because there are no free workers.
+    Thus, every single coroutine is either awaiting an already acquired lock, or awaiting for free workers in executor.
+
+    """
+    lock1, lock2 = mp.Lock(), mp.Lock()
+
+    async def coro():
+        async with enter_asynchronously(lock1):
+            await asyncio.sleep(1e-2)
+            async with enter_asynchronously(lock2):
+                await asyncio.sleep(1e-2)
+
+    num_coros = max(100, mp.cpu_count() * 5 + 1)
+    # note: if we deprecate py3.7, this can be reduced to max(33, cpu + 5); see https://bugs.python.org/issue35279
+    await asyncio.wait({coro() for _ in range(num_coros)})
+
+
 def test_batch_tensor_descriptor_msgpack():
     tensor_descr = BatchTensorDescriptor.from_tensor(torch.ones(1, 3, 3, 7))
     tensor_descr_roundtrip = MSGPackSerializer.loads(MSGPackSerializer.dumps(tensor_descr))