
Faster beam search through DHT sub-keys (#107)

* Added support for dictionary-like DHT keys with sub-keys (see the sketch below)
* New beam search based on the new dictionary-style prefixes
* DHTNode now uses a more careful caching policy on store: if a value was rejected, the node requests the latest value to update its cache
* Added tests for dictionary value types (storage, protocol, node)
* LocalStorage was moved to a separate file and generalized for the new value types
* Fixed a minor bug where DHTProtocol.store claimed to return None but didn't
* More tests
justheuristic committed 4 years ago · commit 9f9c4ac96b
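
To make the new sub-key layout concrete, here is a small, self-contained Python sketch of what declare_experts now stores for a single expert, mirroring _declare_experts in the diff below. The uid and endpoint are made-up example values, not part of this commit.

from typing import List, Tuple

UID_DELIMITER = '.'  # same delimiter DHT uses to split expert uids into grid coordinates

def dht_entries_for_expert(uid: str, endpoint: str) -> List[Tuple[str, str, list]]:
    """Return the (key, subkey, value) triples that declare_experts would store for one expert."""
    entries = [(uid, "expert", [uid, endpoint])]  # the full uid itself, under a dedicated "expert" subkey
    parts = uid.split(UID_DELIMITER)
    for i in range(len(parts) - 1):  # every proper prefix of the uid...
        prefix = UID_DELIMITER.join(parts[:i + 1])
        entries.append((prefix, parts[i + 1], [uid, endpoint]))  # ...keyed by the next grid index as subkey
    return entries

print(dht_entries_for_expert("ffn_expert.3.7.2", "127.0.0.1:1337"))
# [('ffn_expert.3.7.2', 'expert', ['ffn_expert.3.7.2', '127.0.0.1:1337']),
#  ('ffn_expert', '3', [...]), ('ffn_expert.3', '7', [...]), ('ffn_expert.3.7', '2', [...])]

Because every expert that shares a prefix lands under the same DHT key, beam search can fetch all active continuations of a prefix with a single get request instead of probing candidate uids one by one.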

+ 5 - 0
docs/modules/dht.rst

@@ -10,6 +10,11 @@ Here's a high level scheme of how these components interact with one another:
    :width: 640
    :align: center

+
+**Note:** hivemind.DHT is currently being updated to improve beam search latency
+(see `issue 92 <https://github.com/learning-at-home/hivemind/issues>`__). New functionality will be documented
+here by 2020.10.15 23:59:59 AOE (ping justheuristic for details).
+
 DHT and DHTNode
 ###############


+ 1 - 1
hivemind/__init__.py

@@ -3,4 +3,4 @@ from hivemind.dht import *
 from hivemind.server import *
 from hivemind.utils import *

-__version__ = '0.8.4'
+__version__ = '0.8.5'

+ 146 - 13
hivemind/dht/__init__.py

@@ -14,11 +14,12 @@ The code is organized as follows:
 """
 import asyncio
 import ctypes
+import heapq
 import multiprocessing as mp
 import warnings
 from collections import deque, OrderedDict
 from concurrent.futures import ThreadPoolExecutor
-from typing import List, Tuple, Optional, Sequence, OrderedDict as TOrderedDict, Union, Awaitable
+from typing import List, Tuple, Optional, Sequence, OrderedDict as TOrderedDict, Union, Awaitable, Dict, Deque, Set
 
 import uvloop
 
@@ -67,7 +68,6 @@ class DHT(mp.Process):
     This beam search explores one additional dimension per step and finds k best experts from across the DHT
     in O(k / s * log(N)) average time where s is grid sparsity rate and N is the total number of experts.
     """
-
     UID_DELIMITER = '.'  # when declaring experts, DHT store all prefixes of that expert's uid, split over this prefix
     #  formally, prefixes = {uid.split(UID_DELIMITER)[:length] for length in range(1, uid.count(UID_DELIMITER) + 2)}
 
@@ -147,7 +147,9 @@ class DHT(mp.Process):
             expiration_time = get_dht_time()
         num_workers = len(uids) if self.max_workers is None else min(len(uids), self.max_workers)
         response = await node.get_many(uids, expiration_time, num_workers=num_workers)
-        future.set_result([RemoteExpert(**expert_data) if maybe_expiration_time else None
+        # TODO expert_data['expert'] -> namedtuple with meaningful field names
+        future.set_result([RemoteExpert(*expert_data['expert'][0])
+                           if maybe_expiration_time else None and expert_data['expert'][1] is not None
                            for uid, (expert_data, maybe_expiration_time) in response.items()])
 
     def declare_experts(self, uids: List[str], endpoint: Endpoint, wait=True, timeout=None) -> Optional[List[bool]]:
@@ -169,18 +171,148 @@ class DHT(mp.Process):
     async def _declare_experts(self, node: DHTNode, uids: List[str], endpoint: Endpoint, future: Optional[MPFuture]):
         num_workers = len(uids) if self.max_workers is None else min(len(uids), self.max_workers)
         expiration_time = get_dht_time() + self.expiration
-
-        data_to_store = {}
-        for uid in uids:
+        unique_entries: Set[Tuple[str, str]] = set()
+        #                 prefix---v next_dim     uid  endpoint
+        data_to_store: List[Tuple[str, str, List[str, Endpoint]]] = []
+        for uid in uids:  # first k entries are expert uids themselves
+            data_to_store.append((uid, "expert", [uid, endpoint]))
+        for uid in uids:  # and then, add all prefixes
             uid_parts = uid.split(self.UID_DELIMITER)
-            for i in range(len(uid_parts)):
+            for i in range(len(uid_parts) - 1):
                 uid_prefix_i = self.UID_DELIMITER.join(uid_parts[:i + 1])
-                data_to_store[uid_prefix_i] = {'uid': uid, 'endpoint': endpoint}
+                if (uid_prefix_i, uid_parts[i + 1]) in unique_entries:
+                    continue
+                unique_entries.add((uid_prefix_i, uid_parts[i + 1]))
+                data_to_store.append((uid_prefix_i, uid_parts[i + 1], [uid, endpoint]))
+
+        keys, subkeys, values = map(list, zip(*data_to_store))
+        store_ok = await node.store_many(keys, values, expiration_time, subkeys=subkeys, num_workers=num_workers)
+        if future is not None:
+            future.set_result([store_ok[key, subkey] for key, subkey in zip(keys, subkeys)])
+
+    def find_best_experts(self, prefix: str, grid_scores: Sequence[Sequence[float]], beam_size: int, *,
+                          return_future=False, **kwargs) -> Union[List[RemoteExpert], MPFuture]:
+        """
+        Find and return :beam_size: active experts with highest scores, use both local cache and DHT
+
+        :param prefix: common prefix for all expert uids in grid
+        :param grid_scores: scores predicted for each dimension in the grid,
+        :type grid_scores: model scores for each grid dimension, list of arrays of shape grid_size[i]
+        :param beam_size: how many best experts should beam search return
+         After time_budget is reached, beam search won't search for more experts and instead fall back on local cache
+         Please note that any queries that fall outside the budget will still be performed in background and cached
+         for subsequent iterations as long as DHTNode.cache_locally is True
+        :param return_future: if set to True, returns MPFuture that can be awaited to get the actual result
+        :param kwargs: extra keyword parameters passed to DHTNode.get_many
+        :returns: a list that contains *up to* k_best RemoteExpert instances
+        """
+        future, _future = MPFuture.make_pair()
+        self.pipe.send(('_find_best_experts', [], dict(prefix=prefix, grid_scores=list(map(tuple, grid_scores)),
+                                                       beam_size=beam_size, future=_future, **kwargs)))
+        return future if return_future else future.result()
+
+    async def _find_best_experts(
+            self, node: DHTNode, prefix: str, grid_scores: List[Tuple[float]], beam_size: int,
+            max_workers: Optional[int] = None, future: Optional[MPFuture] = None, **kwargs) -> List[RemoteExpert]:
+        max_workers: Optional[int] = max_workers or self.max_workers or beam_size
+
+        # form initial beam from top-k active L1 prefixes, each row is (score, uid prefix, possible suffixes)
+        beam: List[Tuple[float, str, Dict[str, List[str, Endpoint]]]] = await self._get_initial_beam(
+            node, prefix, beam_size, grid_scores[0], num_workers=min(beam_size, max_workers))
+        if not beam:
+            logger.warning(f"Beam search had to terminate prematurely because of empty beam (dim 0)")
+            return []
+
+        for dim_index in range(1, len(grid_scores) - 1):
+            # select beam_size best suffixes from current beam
+            dim_scores = grid_scores[dim_index]
+            best_active_pairs: List[Tuple[float, str]] = heapq.nlargest(beam_size, (
+                (prefix_score + dim_scores[int(suffix_i)], f"{prefix}{self.UID_DELIMITER}{suffix_i}")
+                for prefix_score, prefix, suffixes in beam for suffix_i in suffixes.keys()
+                # TODO get rid of str.isdecimal
+                if str.isdecimal(suffix_i) and 0 <= int(suffix_i) < len(dim_scores)))
+
+            # search DHT for next step suffixes
+            _, best_uid_prefixes = zip(*best_active_pairs)
+            # TODO Tuple[Dict[str, List[str, Endpoint]], DHTExpiration] -> namedtuple
+            dht_responses: Dict[str, Tuple[Dict[str, List[str, Endpoint]], DHTExpiration]] = await node.get_many(
+                keys=best_uid_prefixes, num_workers=min(len(best_uid_prefixes), max_workers), **kwargs)
+            if all(expiration is None for key, (_, expiration) in dht_responses.items()):
+                logger.warning(f"Beam search had to terminate prematurely because of empty beam (dim {dim_index})")
+                break
+            beam = [(prefix_score, prefix, dht_responses[prefix][0])  # add suffix dict if it is found
+                    for prefix_score, prefix in best_active_pairs if dht_responses[prefix][1] is not None]
+
+        # select best experts from the final beam
+        dim_scores = grid_scores[-1]
+        final_best_pairs: List[Tuple[float, str, Endpoint]] = heapq.nlargest(beam_size, (
+            (prefix_score + dim_scores[int(suffix_i)], uid, endpoint)
+            for prefix_score, prefix, suffixes in beam for suffix_i, ((uid, endpoint), _) in suffixes.items()
+            if str.isdecimal(suffix_i) and 0 <= int(suffix_i) < len(dim_scores)
+        ))
+        best_experts = [RemoteExpert(uid, endpoint) for score, uid, endpoint in final_best_pairs]
+        if future is not None:
+            future.set_result(best_experts)
+        return best_experts
+
+    def batch_find_best_experts(self, prefix: str, batch_grid_scores: Sequence[Sequence[Sequence[float]]], beam_size: int, *,
+                                return_future=False, **kwargs) -> Union[List[RemoteExpert], MPFuture]:
+        """
+        Find and return :beam_size: active experts with highest scores, use both local cache and DHT
+
+        :param prefix: common prefix for all expert uids in grid
+        :param batch_grid_scores: scores predicted for each batch example and each dimension in the grid,
+        :type batch_grid_scores: model scores for each example and each grid dimension,  list of arrays of shape (batch_size, grid_size[i])
+        :param beam_size: how many best experts should beam search return
+         After time_budget is reached, beam search won't search for more experts and instead fall back on local cache
+         Please note that any queries that fall outside the budget will still be performed in background and cached
+         for subsequent iterations as long as DHTNode.cache_locally is True
+        :param return_future: if set to True, returns MPFuture that can be awaited to get the actual result
+        :param kwargs: extra keyword parameters passed to DHTNode.get_many
+        :returns: a list that contains *up to* k_best RemoteExpert instances
+        """
+        future, _future = MPFuture.make_pair()
+        self.pipe.send(('_batch_find_best_experts', [], dict(prefix=prefix, batch_grid_scores=batch_grid_scores,
+                                                             beam_size=beam_size, future=_future, **kwargs)))
+        return future if return_future else future.result()
+
+    async def _batch_find_best_experts(
+            self, node: DHTNode, prefix: str, batch_grid_scores: Sequence[Sequence[Tuple[float]]], beam_size: int,
+            max_workers: Optional[int] = None, future: Optional[MPFuture] = None, **kwargs) -> List[List[RemoteExpert]]:
+
+        batch_grid_scores = [[tuple(grid_score[i]) for grid_score in batch_grid_scores] for i in range(len(batch_grid_scores[0]))]
+        coros = [self._find_best_experts(node, prefix, grid_scores, beam_size, max_workers, **kwargs) for grid_scores in batch_grid_scores]
 
-        store_keys, store_values = zip(*data_to_store.items())
-        store_ok = await node.store_many(store_keys, store_values, expiration_time, num_workers=num_workers)
+        best_experts_batch = await asyncio.gather(*coros)
         if future is not None:
-            future.set_result([store_ok[key] for key in data_to_store.keys()])
+            future.set_result(best_experts_batch)
+        return best_experts_batch
+
+    async def _get_initial_beam(self, node, prefix: str, beam_size: int, scores: Tuple[float, ...], num_workers: int
+                                ) -> List[Tuple[float, str, Dict[str, List[str]]]]:
+        """ Fetch a list of all active level-one prefixes of a given prefix. Used for beam search """
+        beam: List[Tuple[float, str, Dict[str, List[str, Endpoint]]]] = []  # results will be stored here
+        unattempted_indices: List[int] = sorted(range(len(scores)), key=scores.__getitem__)  # order: worst to best
+        pending_tasks: Deque[Tuple[int, str, asyncio.Task]] = deque()  # up to num_workers concurrent get tasks
+
+        while len(beam) < beam_size and (unattempted_indices or pending_tasks):
+            # dispatch additional tasks
+            while unattempted_indices and len(pending_tasks) < num_workers:
+                next_index = unattempted_indices.pop()  # note: this is best unattempted index because of sort order
+                next_best_prefix = f"{prefix}{self.UID_DELIMITER}{next_index}"
+                pending_tasks.append((next_index, next_best_prefix, asyncio.create_task(node.get(next_best_prefix))))
+
+            # await the next best prefix to be fetched
+            pending_best_index, pending_best_prefix, pending_task = pending_tasks.popleft()
+            try:
+                maybe_prefix_data, maybe_expiration_time = await pending_task
+                if maybe_expiration_time is not None:
+                    beam.append((scores[pending_best_index], pending_best_prefix, maybe_prefix_data))
+            except asyncio.CancelledError:
+                for _, pending_task in pending_tasks:
+                    pending_task.cancel()
+                raise
+        return beam
 
     def first_k_active(
             self, uid_prefixes: List[str], k: int, max_prefetch: int = 1, chunk_size: Optional[int] = None,
@@ -196,6 +328,7 @@ class DHT(mp.Process):
         :returns: a ordered dict{uid_prefix -> RemoteExpert} mapping at most :k: prefixes to matching experts
             The keys in the returned dict are ordered same as in uid_prefixes.
         """
+        logger.warning("first_k_active is deprecated and will be removed in 0.8.6")
         assert not isinstance(uid_prefixes, str), "please provide a list/tuple of prefixes as the first argument"
         future, _future = MPFuture.make_pair()
         self.pipe.send(('_first_k_active', [],
@@ -220,8 +353,8 @@ class DHT(mp.Process):
             response = await pending_tasks.popleft()
             for uid_prefix in uid_prefixes[chunk_i * chunk_size: (chunk_i + 1) * chunk_size]:
                 maybe_expert_data, maybe_expiration_time = response[uid_prefix]
-                if maybe_expiration_time is not None:  # found active peer
-                    found.append((uid_prefix, RemoteExpert(**maybe_expert_data)))
+                if maybe_expiration_time is not None and len(maybe_expert_data) > 0:  # found active peer
+                    found.append((uid_prefix, RemoteExpert(*next(iter(maybe_expert_data.values()))[0])))
                     # if we found enough active experts, finish immediately
                     if len(found) >= k:
                         break
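
For orientation, here is a hypothetical call to the new beam search entry point added above. The grid sizes, the scores, and the way the DHT handle is obtained are illustrative assumptions, not part of the commit.

import hivemind

# assumes a DHT process started elsewhere in this script and experts declared via declare_experts
dht = hivemind.DHT(start=True)

grid_scores = [
    [0.1, 2.5, -0.3],        # dimension 0: three options
    [1.0, 0.0, 0.7, -1.2],   # dimension 1: four options
    [0.2, 0.9],              # dimension 2: two options
]

# returns up to beam_size RemoteExpert instances with uids such as "ffn_expert.1.0.1",
# ranked by the sum of per-dimension scores; only experts actually present in the DHT are returned
best_experts = dht.find_best_experts("ffn_expert", grid_scores, beam_size=4)

Roughly speaking, each search step issues at most beam_size get requests for the current prefixes, so the number of DHT round trips scales with the number of grid dimensions rather than with the number of candidate uids.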

+ 147 - 110
hivemind/dht/node.py

@@ -1,17 +1,18 @@
 from __future__ import annotations
 
 import asyncio
-
 import random
 from collections import defaultdict
 from dataclasses import dataclass, field
-from typing import Optional, Tuple, List, Dict, DefaultDict, Collection, Union, Set, Awaitable, Callable, Any, Iterable
-from sortedcontainers import SortedList
 from functools import partial
+from typing import Optional, Tuple, List, Dict, DefaultDict, Collection, Union, Set, Awaitable, Callable, Any
 from warnings import warn
 
-from hivemind.dht.protocol import DHTProtocol, LocalStorage
-from hivemind.dht.routing import DHTID, DHTExpiration, DHTKey, get_dht_time, DHTValue, BinaryDHTValue
+from sortedcontainers import SortedList
+
+from hivemind.dht.protocol import DHTProtocol
+from hivemind.dht.routing import DHTID, DHTExpiration, DHTKey, get_dht_time, DHTValue, BinaryDHTValue, Subkey
+from hivemind.dht.storage import CacheRefreshQueue, DictionaryDHTValue
 from hivemind.dht.traverse import traverse_dht
 from hivemind.utils import Endpoint, LOCALHOST, MSGPackSerializer, get_logger, SerializerBase
 
@@ -39,7 +40,7 @@ class DHTNode:
         nearest peers from recipient's routing table (ordered nearest-to-farthest, not including recipient itself)
         This RPC is a mixture between Kademlia FIND_NODE and FIND_VALUE with multiple keys per call.
 
-    Formally, DHTNode follows the following contract:
+    A DHTNode follows the following contract:
 
     - when asked to get(key), a node must find and return a value with highest expiration time that it found across DHT
       IF that time has not come yet. if expiration time is smaller than current get_dht_time(), node may return None;
@@ -53,9 +54,8 @@ class DHTNode:
     # fmt:off
     node_id: DHTID; is_alive: bool; port: int; num_replicas: int; num_workers: int; protocol: DHTProtocol
     refresh_timeout: float; cache_locally: bool; cache_nearest: int; cache_refresh_before_expiry: float
-    cache_refresh_available: asyncio.Event; cache_refresh_queue: LocalStorage
-    reuse_get_requests: bool; pending_get_requests: DefaultDict[DHTID, SortedList[_IntermediateResult]]
-    serializer = MSGPackSerializer  # used to pack/unpack DHT Values for transfer over network
+    cache_on_store: bool; reuse_get_requests: bool; pending_get_requests: DefaultDict[DHTID, SortedList[_SearchState]]
+    cache_refresh_task: Optional[asyncio.Task]; cache_refresh_evt: asyncio.Event; cache_refresh_queue: CacheRefreshQueue
     # fmt:on
 
     @classmethod
@@ -64,8 +64,8 @@ class DHTNode:
             bucket_size: int = 20, num_replicas: int = 5, depth_modulo: int = 5, parallel_rpc: int = None,
             wait_timeout: float = 5, refresh_timeout: Optional[float] = None, bootstrap_timeout: Optional[float] = None,
             cache_locally: bool = True, cache_nearest: int = 1, cache_size=None, cache_refresh_before_expiry: float = 5,
-            reuse_get_requests: bool = True, num_workers: int = 1, listen: bool = True,
-            listen_on: Endpoint = "0.0.0.0:*", **kwargs) -> DHTNode:
+            cache_on_store: bool = True, reuse_get_requests: bool = True, num_workers: int = 1,
+            listen: bool = True, listen_on: Endpoint = "0.0.0.0:*", **kwargs) -> DHTNode:
         """
         :param node_id: current node's identifier, determines which keys it will store locally, defaults to random id
         :param initial_peers: connects to these peers to populate routing table, defaults to no peers
@@ -81,6 +81,7 @@ class DHTNode:
           if staleness_timeout is None, DHTNode will not refresh stale buckets (which is usually okay)
         :param bootstrap_timeout: after one of peers responds, await other peers for at most this many seconds
         :param cache_locally: if True, caches all values (stored or found) in a node-local cache
+        :param cache_on_store: if True, update cache entries for a key after storing a new item for that key
         :param cache_nearest: whenever DHTNode finds a value, it will also store (cache) this value on this many
           nodes nearest nodes visited by search algorithm. Prefers nodes that are nearest to :key: but have no value yet
         :param cache_size: if specified, local cache will store up to this many records (as in LRU cache)
@@ -96,10 +97,6 @@ class DHTNode:
           see https://grpc.github.io/grpc/core/group__grpc__arg__keys.html for a list of all options
         :param kwargs: extra parameters used in grpc.aio.server
         """
-        if cache_refresh_before_expiry > 0 and not cache_locally:
-            logger.warning("If cache_locally is False, cache_refresh_before_expiry has no effect. To silence this"
-                           " warning, please specify cache_refresh_before_expiry=0")
-
         self = cls(_initialized_with_create=True)
         self.node_id = node_id = node_id if node_id is not None else DHTID.generate()
         self.num_replicas, self.num_workers = num_replicas, num_workers
@@ -110,12 +107,11 @@ class DHTNode:
 
         # caching policy
         self.refresh_timeout = refresh_timeout
-        self.cache_locally, self.cache_nearest = cache_locally, cache_nearest
+        self.cache_locally, self.cache_nearest, self.cache_on_store = cache_locally, cache_nearest, cache_on_store
         self.cache_refresh_before_expiry = cache_refresh_before_expiry
-        self.cache_refresh_queue = LocalStorage()
-        self.cache_refresh_available = asyncio.Event()
-        if cache_refresh_before_expiry:
-            asyncio.create_task(self._refresh_stale_cache_entries())
+        self.cache_refresh_queue = CacheRefreshQueue()
+        self.cache_refresh_evt = asyncio.Event()
+        self.cache_refresh_task = None
 
         self.protocol = await DHTProtocol.create(self.node_id, bucket_size, depth_modulo, num_replicas, wait_timeout,
                                                  parallel_rpc, cache_size, listen, listen_on, **kwargs)
@@ -211,25 +207,27 @@ class DHTNode:
             nearest_nodes_with_endpoints[query] = {node: node_to_endpoint[node] for node in nearest_nodes[:k_nearest]}
         return nearest_nodes_with_endpoints
 
-    async def store(self, key: DHTKey, value: DHTValue, expiration_time: DHTExpiration, **kwargs) -> bool:
+    async def store(self, key: DHTKey, value: DHTValue, expiration_time: DHTExpiration,
+                    subkey: Optional[Subkey] = None, **kwargs) -> bool:
         """
         Find num_replicas best nodes to store (key, value) and store it there at least until expiration time.
-
         :note: store is a simplified interface to store_many, all kwargs are be forwarded there
         :returns: True if store succeeds, False if it fails (due to no response or newer value)
         """
-        store_ok = await self.store_many([key], [value], [expiration_time], **kwargs)
-        return store_ok[key]
+        store_ok = await self.store_many([key], [value], [expiration_time], subkeys=[subkey], **kwargs)
+        return store_ok[(key, subkey) if subkey is not None else key]
 
     async def store_many(self, keys: List[DHTKey], values: List[DHTValue],
                          expiration_time: Union[DHTExpiration, List[DHTExpiration]],
+                         subkeys: Optional[Union[Subkey, List[Optional[Subkey]]]] = None,
                          exclude_self: bool = False, await_all_replicas=True, **kwargs) -> Dict[DHTKey, bool]:
         """
-        Traverse DHT to find up to best nodes to store multiple (key, value, expiration_time) pairs.
+        Traverse DHT to find up :num_replicas: to best nodes to store multiple (key, value, expiration_time) pairs.
 
         :param keys: arbitrary serializable keys associated with each value
         :param values: serializable "payload" for each key
         :param expiration_time: either one expiration time for all keys or individual expiration times (see class doc)
+        :param subkeys: an optional list of same shape as keys. If specified, this
         :param kwargs: any additional parameters passed to traverse_dht function (e.g. num workers)
         :param exclude_self: if True, never store value locally even if you are one of the nearest nodes
         :note: if exclude_self is True and self.cache_locally == True, value will still be __cached__ locally
@@ -239,24 +237,23 @@
         """
         if isinstance(expiration_time, DHTExpiration):
             expiration_time = [expiration_time] * len(keys)
-        assert len(keys) == len(values) == len(expiration_time), "Number of keys, values and expiration doesn't match."
+        if subkeys is None or isinstance(subkeys, Subkey):
+            subkeys = [subkeys] * len(keys)
 
-        key_ids = list(map(DHTID.generate, keys))
-        id_to_original_key = dict(zip(key_ids, keys))
-        binary_values_by_key_id = {key_id: self.serializer.dumps(value) for key_id, value in zip(key_ids, values)}
-        expiration_by_key_id = {key_id: expiration_time for key_id, expiration_time in zip(key_ids, expiration_time)}
-        unfinished_key_ids = set(key_ids)  # we use this set to ensure that each store request is finished
+        assert len(keys) == len(subkeys) == len(values) == len(expiration_time), \
+            "Either of keys, values, subkeys or expiration timestamps have different sequence lengths."
 
-        store_ok = {key: False for key in keys}  # outputs, updated during search
-        store_finished_events = {key: asyncio.Event() for key in keys}
+        key_id_to_data: DefaultDict[DHTID, List[Tuple[DHTKey, Subkey, DHTValue, DHTExpiration]]] = defaultdict(list)
+        for key, subkey, value, expiration in zip(keys, subkeys, values, expiration_time):
+            key_id_to_data[DHTID.generate(source=key)].append((key, subkey, value, expiration))
 
-        if self.cache_locally:
-            for key_id in key_ids:
-                self.protocol.cache.store(key_id, binary_values_by_key_id[key_id], expiration_by_key_id[key_id])
+        unfinished_key_ids = set(key_id_to_data.keys())  # use this set to ensure that each store request is finished
+        store_ok = {(key, subkey): None for key, subkey in zip(keys, subkeys)}  # outputs, updated during search
+        store_finished_events = {(key, subkey): asyncio.Event() for key, subkey in zip(keys, subkeys)}
 
         # pre-populate node_to_endpoint
         node_to_endpoint: Dict[DHTID, Endpoint] = dict()
-        for key_id in key_ids:
+        for key_id in unfinished_key_ids:
             node_to_endpoint.update(self.protocol.routing_table.get_nearest_neighbors(
                 key_id, self.protocol.bucket_size, exclude=self.node_id))
 
@@ -272,48 +269,73 @@ class DHTNode:
             pending_store_tasks = set()
             store_candidates = sorted(nearest_nodes + ([] if exclude_self else [self.node_id]),
                                       key=key_id.xor_distance, reverse=True)  # ordered so that .pop() returns nearest
+            [original_key, *_], current_subkeys, current_values, current_expirations = zip(*key_id_to_data[key_id])
+            binary_values: List[bytes] = list(map(self.protocol.serializer.dumps, current_values))
 
             while num_successful_stores < self.num_replicas and (store_candidates or pending_store_tasks):
-                # spawn enough tasks to cover all replicas
                 while store_candidates and num_successful_stores + len(pending_store_tasks) < self.num_replicas:
                     node_id: DHTID = store_candidates.pop()  # nearest untried candidate
+
                     if node_id == self.node_id:
-                        self.protocol.storage.store(key_id, binary_values_by_key_id[key_id],
-                                                    expiration_by_key_id[key_id])
-                        store_ok[id_to_original_key[key_id]] = True
                         num_successful_stores += 1
-                        if not await_all_replicas:
-                            store_finished_events[id_to_original_key[key_id]].set()
-
+                        for subkey, value, expiration_time in zip(current_subkeys, binary_values, current_expirations):
+                            store_ok[original_key, subkey] = self.protocol.storage.store(
+                                key_id, value, expiration_time, subkey=subkey)
+                            if not await_all_replicas:
+                                store_finished_events[original_key, subkey].set()
                     else:
                         pending_store_tasks.add(asyncio.create_task(self.protocol.call_store(
-                            node_to_endpoint[node_id], [key_id], [binary_values_by_key_id[key_id]],
-                            [expiration_by_key_id[key_id]])))
+                            node_to_endpoint[node_id], keys=[key_id] * len(current_values), values=binary_values,
+                            expiration_time=current_expirations, subkeys=current_subkeys)))
 
                 # await nearest task. If it fails, dispatch more on the next iteration
                 if pending_store_tasks:
                     finished_store_tasks, pending_store_tasks = await asyncio.wait(
                         pending_store_tasks, return_when=asyncio.FIRST_COMPLETED)
                     for task in finished_store_tasks:
-                        if task.result()[0]:  # if store succeeded
-                            store_ok[id_to_original_key[key_id]] = True
+                        if task.result() is not None:
                             num_successful_stores += 1
-                            if not await_all_replicas:
-                                store_finished_events[id_to_original_key[key_id]].set()
+                            for subkey, store_status in zip(current_subkeys, task.result()):
+                                store_ok[original_key, subkey] = store_status
+                                if not await_all_replicas:
+                                    store_finished_events[original_key, subkey].set()
 
-            store_finished_events[id_to_original_key[key_id]].set()
+            if self.cache_on_store:
+                self._update_cache_on_store(key_id, current_subkeys, binary_values, current_expirations,
+                                            store_ok=[store_ok[original_key, subkey] for subkey in current_subkeys])
+
+            for subkey, value_bytes, expiration in zip(current_subkeys, binary_values, current_expirations):
+                store_finished_events[original_key, subkey].set()
 
         store_task = asyncio.create_task(self.find_nearest_nodes(
-            queries=set(key_ids), k_nearest=self.num_replicas, node_to_endpoint=node_to_endpoint,
+            queries=set(unfinished_key_ids), k_nearest=self.num_replicas, node_to_endpoint=node_to_endpoint,
             found_callback=on_found, exclude_self=exclude_self, **kwargs))
         try:
             await asyncio.wait([evt.wait() for evt in store_finished_events.values()])  # wait for items to be stored
             assert len(unfinished_key_ids) == 0, "Internal error: traverse_dht didn't finish search"
-            return store_ok
+            return {(key, subkey) if subkey else key: status or False for (key, subkey), status in store_ok.items()}
         except asyncio.CancelledError as e:
             store_task.cancel()
             raise e
 
+    def _update_cache_on_store(self, key_id: DHTID, subkeys: List[Subkey], binary_values: List[bytes],
+                               expirations: List[DHTExpiration], store_ok: List[bool]):
+        """ Update local cache after finishing a store for one key (with perhaps several subkeys) """
+        store_succeeded = any(store_ok)
+        is_dictionary = any(subkey is not None for subkey in subkeys)
+        if store_succeeded and not is_dictionary:  # stored a new regular value, cache it!
+            stored_value_bytes, stored_expiration = max(zip(binary_values, expirations), key=lambda p: p[1])
+            self.protocol.cache.store(key_id, stored_value_bytes, stored_expiration)
+        elif not store_succeeded and not is_dictionary:  # store rejected, check if local cache is also obsolete
+            rejected_value, rejected_expiration = max(zip(binary_values, expirations), key=lambda p: p[1])
+            self.protocol.cache.store(key_id, rejected_value, rejected_expiration)  # can still be better than cache
+            if (self.protocol.cache.get(key_id)[1] or float("inf")) <= rejected_expiration:  # cache would be rejected
+                self._schedule_for_refresh(key_id, refresh_time=get_dht_time())  # fetch new key in background (asap)
+        else:  # stored a dictionary (or failed to store), either way, there can be other keys and we should update
+            for subkey, stored_value_bytes, expiration_time in zip(subkeys, binary_values, expirations):
+                self.protocol.cache.store_subkey(key_id, subkey, stored_value_bytes, expiration_time)
+            self._schedule_for_refresh(key_id, refresh_time=get_dht_time())  # fetch new key in background (asap)
+
     async def get(self, key: DHTKey, latest=False, **kwargs) -> Tuple[Optional[DHTValue], Optional[DHTExpiration]]:
         """
         Search for a key across DHT and return either first or latest entry.
@@ -350,8 +372,8 @@ class DHTNode:
     async def get_many_by_id(
             self, key_ids: Collection[DHTID], sufficient_expiration_time: Optional[DHTExpiration] = None,
             num_workers: Optional[int] = None, beam_size: Optional[int] = None, return_futures: bool = False,
-            _refresh_cache=True) -> Dict[DHTID, Union[Tuple[Optional[DHTValue], Optional[DHTExpiration]],
-                                                      Awaitable[Tuple[Optional[DHTValue], Optional[DHTExpiration]]]]]:
+            _is_refresh=False) -> Dict[DHTID, Union[Tuple[Optional[DHTValue], Optional[DHTExpiration]],
+                                                    Awaitable[Tuple[Optional[DHTValue], Optional[DHTExpiration]]]]]:
         """
         Traverse DHT to find a list of DHTIDs. For each key, return latest (value, expiration) or None if not found.
 
@@ -364,17 +386,17 @@ class DHTNode:
         :param return_futures: if True, immediately return asyncio.Future for every before interacting with the nework.
          The algorithm will populate these futures with (value, expiration) when it finds the corresponding key
          Note: canceling a future will stop search for the corresponding key
-        :param _refresh_cache: internal flag, whether or not to self._trigger_cache_refresh
+        :param _is_refresh: internal flag, set to True by an internal cache refresher (if enabled)
         :returns: for each key: value and its expiration time. If nothing is found, returns (None, None) for that key
         :note: in order to check if get returned a value, please check (expiration_time is None)
         """
         sufficient_expiration_time = sufficient_expiration_time or get_dht_time()
         beam_size = beam_size if beam_size is not None else self.protocol.bucket_size
         num_workers = num_workers if num_workers is not None else self.num_workers
-        search_results: Dict[DHTID, _IntermediateResult] = {key_id: _IntermediateResult(
-            key_id, sufficient_expiration_time, serializer=self.serializer) for key_id in key_ids}
+        search_results: Dict[DHTID, _SearchState] = {key_id: _SearchState(
+            key_id, sufficient_expiration_time, serializer=self.protocol.serializer) for key_id in key_ids}
 
-        if _refresh_cache:
+        if not _is_refresh:  # if we're already refreshing cache, there's no need to trigger subsequent refreshes
             for key_id in key_ids:
                 search_results[key_id].add_done_callback(self._trigger_cache_refresh)
 
@@ -387,7 +409,8 @@ class DHTNode:
         # stage 1: check for value in this node's local storage and cache
         for key_id in key_ids:
             search_results[key_id].add_candidate(*self.protocol.storage.get(key_id), source_node_id=self.node_id)
-            search_results[key_id].add_candidate(*self.protocol.cache.get(key_id), source_node_id=self.node_id)
+            if not _is_refresh:
+                search_results[key_id].add_candidate(*self.protocol.cache.get(key_id), source_node_id=self.node_id)
 
         # stage 2: traverse the DHT to get the remaining keys from remote peers
         unfinished_key_ids = [key_id for key_id in key_ids if not search_results[key_id].finished]
@@ -414,7 +437,7 @@ class DHTNode:
         # V-- this function will be called exactly once when traverse_dht finishes search for a given key
         async def found_callback(key_id: DHTID, nearest_nodes: List[DHTID], _visited: Set[DHTID]):
             search_results[key_id].finish_search()  # finish search whether or we found something
-            self._cache_new_result(search_results[key_id], nearest_nodes, node_to_endpoint)
+            self._cache_new_result(search_results[key_id], nearest_nodes, node_to_endpoint, _is_refresh=_is_refresh)
 
         asyncio.create_task(traverse_dht(
             queries=list(unfinished_key_ids), initial_nodes=list(node_to_endpoint),
@@ -433,9 +456,9 @@ class DHTNode:
                     search_result.future.cancel()
                 raise e
 
-    def _reuse_finished_search_result(self, finished: _IntermediateResult):
+    def _reuse_finished_search_result(self, finished: _SearchState):
         expiration_time_threshold = max(finished.expiration_time or -float('inf'), finished.sufficient_expiration_time)
-        concurrent_requests: SortedList[_IntermediateResult] = self.pending_get_requests[finished.key_id]
+        concurrent_requests: SortedList[_SearchState] = self.pending_get_requests[finished.key_id]
         # note: concurrent_requests is sorded in the order of descending sufficient_expiration_time
         while concurrent_requests and expiration_time_threshold >= concurrent_requests[-1].sufficient_expiration_time:
             concurrent_requests[-1].add_candidate(finished.binary_value, finished.expiration_time,
@@ -443,66 +466,72 @@ class DHTNode:
             concurrent_requests[-1].finish_search()
             concurrent_requests.pop(-1)
 
-    def _trigger_cache_refresh(self, result: _IntermediateResult):
+    def _trigger_cache_refresh(self, search: _SearchState):
         """ Called after get request is finished (whether it was found, not found, hit cache, cancelled, or reused) """
-        if result.found_something and result.source_node_id == self.node_id:
-            with self.protocol.cache.freeze():  # do not clear outdated cache for now...
-                if self.cache_refresh_before_expiry and result.key_id in self.protocol.cache:
-                    previous_earliest_item: Tuple[DHTID, BinaryDHTValue, DHTExpiration] = self.cache_refresh_queue.top()
-                    self.cache_refresh_queue.store(result.key_id, result.binary_value, result.expiration_time)
-                    if previous_earliest_item is None or result.expiration_time < previous_earliest_item[-1]:
-                        self.cache_refresh_available.set()  # if we new element is now earliest, notify the cache queue
+        if search.found_something and search.source_node_id == self.node_id:
+            if self.cache_refresh_before_expiry and search.key_id in self.protocol.cache:
+                self._schedule_for_refresh(search.key_id, search.expiration_time - self.cache_refresh_before_expiry)
+
+    def _schedule_for_refresh(self, key_id: DHTID, refresh_time: DHTExpiration):
+        """ Add key to a refresh queue, refresh at :refresh_time: or later """
+        if self.cache_refresh_task is None or self.cache_refresh_task.done() or self.cache_refresh_task.cancelled():
+            self.cache_refresh_task = asyncio.create_task(self._refresh_stale_cache_entries())
+            logger.debug("Spawned cache refresh task.")
+        previous_earliest_item: Tuple[DHTID, Any, DHTExpiration] = self.cache_refresh_queue.top()
+        if previous_earliest_item is None or refresh_time < previous_earliest_item[-1]:
+            self.cache_refresh_evt.set()  # if we new element is now earliest, notify the cache queue
+        self.cache_refresh_queue.store(key_id, value=refresh_time, expiration_time=refresh_time)
 
     async def _refresh_stale_cache_entries(self):
         """ periodically refresh keys near-expired keys that were accessed at least once during previous lifetime """
         while self.is_alive:
-            with self.cache_refresh_queue.freeze():
-                while len(self.cache_refresh_queue) == 0:
-                    await self.cache_refresh_available.wait()
-                    self.cache_refresh_available.clear()
-                key_id, _, nearest_expiration = self.cache_refresh_queue.top()
+            while len(self.cache_refresh_queue) == 0:
+                await self.cache_refresh_evt.wait()
+                self.cache_refresh_evt.clear()
+            key_id, _, nearest_refresh_time = self.cache_refresh_queue.top()
 
             try:
                 # step 1: await until :cache_refresh_before_expiry: seconds before earliest first element expires
-                time_to_wait = nearest_expiration - get_dht_time() - self.cache_refresh_before_expiry
-                await asyncio.wait_for(self.cache_refresh_available.wait(), timeout=time_to_wait)
+                time_to_wait = nearest_refresh_time - get_dht_time()
+                await asyncio.wait_for(self.cache_refresh_evt.wait(), timeout=time_to_wait)
                 # note: the line above will cause TimeoutError when we are ready to refresh cache
-                self.cache_refresh_available.clear()  # no timeout error => someone added new entry to queue and ...
+                self.cache_refresh_evt.clear()  # no timeout error => someone added new entry to queue and ...
                 continue  # ... and this element is earlier than nearest_expiration. we should refresh this entry first
 
             except asyncio.TimeoutError:  # caught TimeoutError => it is time to refresh the most recent cached entry
                 # step 2: find all keys that we should already refresh and remove them from queue
-                with self.cache_refresh_queue.freeze():
-                    keys_to_refresh = {key_id}
+                current_time = get_dht_time()
+                keys_to_refresh = {key_id}
+                max_expiration_time = self.protocol.cache.get(key_id)[1] or current_time
+                del self.cache_refresh_queue[key_id]  # we pledge to refresh this key_id in the nearest batch
+                while self.cache_refresh_queue:
+                    key_id, _, nearest_refresh_time = self.cache_refresh_queue.top()
+                    if nearest_refresh_time > current_time:
+                        break
                     del self.cache_refresh_queue[key_id]  # we pledge to refresh this key_id in the nearest batch
-                    while self.cache_refresh_queue:
-                        key_id, _, nearest_expiration = self.cache_refresh_queue.top()
-                        if nearest_expiration > get_dht_time() + self.cache_refresh_before_expiry:
-                            break
-                        del self.cache_refresh_queue[key_id]  # we pledge to refresh this key_id in the nearest batch
-                        keys_to_refresh.add(key_id)
+                    keys_to_refresh.add(key_id)
+                    max_expiration_time = max(max_expiration_time, self.protocol.cache.get(key_id)[1] or current_time)
 
                 # step 3: search newer versions of these keys, cache them as a side-effect of self.get_many_by_id
-                await self.get_many_by_id(
-                    keys_to_refresh, sufficient_expiration_time=nearest_expiration + self.cache_refresh_before_expiry,
-                    _refresh_cache=False)  # if we found value locally, we shouldn't trigger another refresh
+                sufficient_expiration_time = max_expiration_time + self.cache_refresh_before_expiry + 1
+                await self.get_many_by_id(keys_to_refresh, sufficient_expiration_time, _is_refresh=True)
 
-    def _cache_new_result(self, result: _IntermediateResult, nearest_nodes: List[DHTID],
-                          node_to_endpoint: Dict[DHTID, Endpoint]):
+    def _cache_new_result(self, search: _SearchState, nearest_nodes: List[DHTID],
+                          node_to_endpoint: Dict[DHTID, Endpoint], _is_refresh: bool = False):
         """ after key_id is found, update cache according to caching policy. used internally in get and get_many """
-        if result.found_something:
-            previous_expiration_time = max(self.protocol.storage.get(result.key_id)[1] or -float('inf'),
-                                           self.protocol.cache.get(result.key_id)[1] or -float('inf'))
-            if result.expiration_time > previous_expiration_time:  # if this value has better expiration
-                if self.cache_locally:
-                    self.protocol.cache.store(result.key_id, result.binary_value, result.expiration_time)
+        if search.found_something:
+            previous_expiration_time = max(self.protocol.storage.get(search.key_id)[1] or -float('inf'),
+                                           self.protocol.cache.get(search.key_id)[1] or -float('inf'))
+            if search.expiration_time > previous_expiration_time:  # if this value has better expiration
+                if self.cache_locally or _is_refresh:
+                    self.protocol.cache.store(search.key_id, search.binary_value, search.expiration_time)
                 if self.cache_nearest:
                 if self.cache_nearest:
                     num_cached_nodes = 0
                     num_cached_nodes = 0
                     for node_id in nearest_nodes:
                     for node_id in nearest_nodes:
-                        if node_id == result.source_node_id:
+                        if node_id == search.source_node_id:
                             continue
                             continue
                         asyncio.create_task(self.protocol.call_store(
                         asyncio.create_task(self.protocol.call_store(
-                            node_to_endpoint[node_id], [result.key_id], [result.binary_value], [result.expiration_time],
+                            node_to_endpoint[node_id], [search.key_id], [search.binary_value], [search.expiration_time],
                             in_cache=True))
                             in_cache=True))
                         num_cached_nodes += 1
                         num_cached_nodes += 1
                         if num_cached_nodes >= self.cache_nearest:
                         if num_cached_nodes >= self.cache_nearest:
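
Put into words, the caching policy applied in _cache_new_result above boils down to the predicate below. This is a simplified restatement under the same parameter names (cache_locally, _is_refresh), not a drop-in replacement: the real method also re-stores the binary value and optionally pushes it to nearby peers via call_store.

def should_cache_locally(found_expiration: float, known_expiration: float,
                         cache_locally: bool, is_refresh: bool) -> bool:
    # cache a freshly found value only if it outlives everything we already hold for that key,
    # and either local caching is enabled or this lookup was triggered by a scheduled cache refresh
    return found_expiration > known_expiration and (cache_locally or is_refresh)
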
@@ -523,11 +552,11 @@ class DHTNode:
 
 
 
 
 @dataclass(init=True, repr=True, frozen=False, order=False)
 @dataclass(init=True, repr=True, frozen=False, order=False)
-class _IntermediateResult:
+class _SearchState:
     """ A helper class that stores current-best GET results with metadata """
     """ A helper class that stores current-best GET results with metadata """
     key_id: DHTID
     key_id: DHTID
     sufficient_expiration_time: DHTExpiration
     sufficient_expiration_time: DHTExpiration
-    binary_value: Optional[BinaryDHTValue] = None
+    binary_value: Optional[Union[BinaryDHTValue, DictionaryDHTValue]] = None
     expiration_time: Optional[DHTExpiration] = None  # best expiration time so far
     expiration_time: Optional[DHTExpiration] = None  # best expiration time so far
     source_node_id: Optional[DHTID] = None  # node that gave us the value
     source_node_id: Optional[DHTID] = None  # node that gave us the value
     future: asyncio.Future[Tuple[Optional[DHTValue], Optional[DHTExpiration]]] = field(default_factory=asyncio.Future)
     future: asyncio.Future[Tuple[Optional[DHTValue], Optional[DHTExpiration]]] = field(default_factory=asyncio.Future)
@@ -540,25 +569,33 @@ class _IntermediateResult:
             if self.expiration_time >= self.sufficient_expiration_time:
             if self.expiration_time >= self.sufficient_expiration_time:
                 self.finish_search()
                 self.finish_search()
 
 
-    def add_done_callback(self, callback: Callable[[_IntermediateResult], Any]):
-        """ Add callback that will be called when _IntermediateSearchResult is done (found OR cancelled by user) """
+    def add_done_callback(self, callback: Callable[[_SearchState], Any]):
+        """ Add callback that will be called when _SearchState is done (found OR cancelled by user) """
         self.future.add_done_callback(lambda _future: callback(self))
         self.future.add_done_callback(lambda _future: callback(self))
 
 
     def finish_search(self):
     def finish_search(self):
         if self.future.done():
         if self.future.done():
-            return  # either user cancelled our result or someone sent it before us. Nothing more to do here.
-        deserialized_value = self.serializer.loads(self.binary_value) if self.found_something else None
-        self.future.set_result((deserialized_value, self.expiration_time))
+            return  # either user cancelled our search or someone sent it before us. Nothing more to do here.
+        elif not self.found_something:
+            self.future.set_result((None, None))
+        elif isinstance(self.binary_value, BinaryDHTValue):
+            self.future.set_result((self.serializer.loads(self.binary_value), self.expiration_time))
+        elif isinstance(self.binary_value, DictionaryDHTValue):
+            dict_value = {key: (self.serializer.loads(value), item_expiration_time)
+                          for key, value, item_expiration_time in self.binary_value.items()}
+            self.future.set_result((dict_value, self.expiration_time))
+        else:
+            logger.error(f"Invalid value type: {type(self.binary_value)}")
 
 
     @property
     @property
     def found_something(self) -> bool:
     def found_something(self) -> bool:
-        """ Whether or not we have at least some result, regardless of its expiration time """
+        """ Whether or not we have found at least some value, regardless of its expiration time """
         return self.expiration_time is not None
         return self.expiration_time is not None
 
 
     @property
     @property
     def finished(self) -> bool:
     def finished(self) -> bool:
         return self.future.done()
         return self.future.done()
 
 
-    def __lt__(self, other: _IntermediateResult):
-        """ _IntermediateResult instances will be sorted by their target expiration time """
+    def __lt__(self, other: _SearchState):
+        """ _SearchState instances will be sorted by their target expiration time """
         return self.sufficient_expiration_time < other.sufficient_expiration_time
         return self.sufficient_expiration_time < other.sufficient_expiration_time
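
From a caller's perspective, finish_search above resolves the future either to (deserialized_value, expiration_time) for regular entries or to ({subkey: (value, item_expiration)}, expiration_time) for dictionary entries. A hedged sketch of that unpacking, reusing the MSGPackSerializer and DictionaryDHTValue interfaces from this commit (the helper name is hypothetical):

from typing import Optional, Tuple, Union

from hivemind.dht.storage import DictionaryDHTValue
from hivemind.utils import MSGPackSerializer

def unpack_found_value(binary_value: Optional[Union[bytes, DictionaryDHTValue]],
                       expiration_time: Optional[float]) -> Tuple[Optional[object], Optional[float]]:
    if binary_value is None:
        return None, None  # nothing was found
    if isinstance(binary_value, DictionaryDHTValue):
        # dictionary values map sub-keys to (deserialized value, per-item expiration time)
        unpacked = {subkey: (MSGPackSerializer.loads(value), item_expiration)
                    for subkey, value, item_expiration in binary_value.items()}
        return unpacked, expiration_time
    return MSGPackSerializer.loads(binary_value), expiration_time  # regular value
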

+ 75 - 130
hivemind/dht/protocol.py

@@ -2,26 +2,28 @@
 from __future__ import annotations
 from __future__ import annotations
 
 
 import asyncio
 import asyncio
-import heapq
-from contextlib import contextmanager
-from typing import Optional, List, Tuple, Dict, Iterator, Any, Sequence, Union, Collection
+from typing import Optional, List, Tuple, Dict, Any, Sequence, Union, Collection
 from warnings import warn
 from warnings import warn
 
 
 import grpc
 import grpc
 import grpc.experimental.aio
 import grpc.experimental.aio
 
 
-from hivemind.dht.routing import RoutingTable, DHTID, BinaryDHTValue, DHTExpiration, get_dht_time
+from hivemind.dht.routing import RoutingTable, DHTID, BinaryDHTValue, DHTExpiration, Subkey
+from hivemind.dht.storage import DHTLocalStorage, DictionaryDHTValue
 from hivemind.proto import dht_pb2, dht_pb2_grpc as dht_grpc
 from hivemind.proto import dht_pb2, dht_pb2_grpc as dht_grpc
-from hivemind.utils import Endpoint, get_logger, replace_port
+from hivemind.utils import Endpoint, get_logger, replace_port, MSGPackSerializer
 
 
 logger = get_logger(__name__)
 logger = get_logger(__name__)
+NOT_FOUND_VALUE, NOT_FOUND_EXPIRATION, IS_REGULAR_VALUE, IS_DICTIONARY = b'', -float('inf'), '', '___DictionaryDHTValue'
+RESERVED_SUBKEYS = {IS_REGULAR_VALUE, IS_DICTIONARY}
 
 
 
 
 class DHTProtocol(dht_grpc.DHTServicer):
 class DHTProtocol(dht_grpc.DHTServicer):
     # fmt:off
     # fmt:off
     node_id: DHTID; port: int; bucket_size: int; num_replicas: int; wait_timeout: float; node_info: dht_pb2.NodeInfo
     node_id: DHTID; port: int; bucket_size: int; num_replicas: int; wait_timeout: float; node_info: dht_pb2.NodeInfo
     channel_options: Optional[Sequence[Tuple[str, Any]]]; server: grpc.experimental.aio.Server
     channel_options: Optional[Sequence[Tuple[str, Any]]]; server: grpc.experimental.aio.Server
-    storage: LocalStorage; cache: LocalStorage; routing_table: RoutingTable; rpc_semaphore: asyncio.Semaphore
+    storage: DHTLocalStorage; cache: DHTLocalStorage; routing_table: RoutingTable; rpc_semaphore: asyncio.Semaphore
+    serializer = MSGPackSerializer  # used to pack/unpack DHT Values for transfer over network
     # fmt:on
     # fmt:on
 
 
     @classmethod
     @classmethod
@@ -44,7 +46,7 @@ class DHTProtocol(dht_grpc.DHTServicer):
         self = cls(_initialized_with_create=True)
         self = cls(_initialized_with_create=True)
         self.node_id, self.bucket_size, self.num_replicas = node_id, bucket_size, num_replicas
         self.node_id, self.bucket_size, self.num_replicas = node_id, bucket_size, num_replicas
         self.wait_timeout, self.channel_options = wait_timeout, channel_options
         self.wait_timeout, self.channel_options = wait_timeout, channel_options
-        self.storage, self.cache = LocalStorage(), LocalStorage(maxsize=cache_size)
+        self.storage, self.cache = DHTLocalStorage(), DHTLocalStorage(maxsize=cache_size)
         self.routing_table = RoutingTable(node_id, bucket_size, depth_modulo)
         self.routing_table = RoutingTable(node_id, bucket_size, depth_modulo)
         self.rpc_semaphore = asyncio.Semaphore(parallel_rpc if parallel_rpc is not None else float('inf'))
         self.rpc_semaphore = asyncio.Semaphore(parallel_rpc if parallel_rpc is not None else float('inf'))
 
 
@@ -110,30 +112,46 @@ class DHTProtocol(dht_grpc.DHTServicer):
             asyncio.create_task(self.update_routing_table(sender_id, rpc_endpoint))
             asyncio.create_task(self.update_routing_table(sender_id, rpc_endpoint))
         return self.node_info
         return self.node_info
 
 
-    async def call_store(self, peer: Endpoint, keys: Sequence[DHTID], values: Sequence[BinaryDHTValue],
+    async def call_store(self, peer: Endpoint, keys: Sequence[DHTID],
+                         values: Sequence[Union[BinaryDHTValue, DictionaryDHTValue]],
                          expiration_time: Union[DHTExpiration, Sequence[DHTExpiration]],
                          expiration_time: Union[DHTExpiration, Sequence[DHTExpiration]],
-                         in_cache: Optional[Union[bool, Sequence[bool]]] = None) -> Sequence[bool]:
+                         subkeys: Optional[Union[Subkey, Sequence[Optional[Subkey]]]] = None,
+                         in_cache: Optional[Union[bool, Sequence[bool]]] = None) -> Optional[List[bool]]:
         """
         """
         Ask a recipient to store several (key, value : expiration_time) items or update their older value
         Ask a recipient to store several (key, value : expiration_time) items or update their older value
 
 
         :param peer: request this peer to store the data
         :param peer: request this peer to store the data
         :param keys: a list of N keys digested by DHTID.generate(source=some_dict_key)
         :param keys: a list of N keys digested by DHTID.generate(source=some_dict_key)
         :param values: a list of N serialized values (bytes) for each respective key
         :param values: a list of N serialized values (bytes) for each respective key
-        :param expiration_time: a list of N expiration timestamps for each respective key-value pair (see get_dht_time())
+        :param expiration_time: a list of N expiration timestamps for each respective key-value pair(see get_dht_time())
+        :param subkeys: a list of N optional sub-keys. If None, stores value normally. If subkey is not None:
+          1) if local storage doesn't have :key:, create a new dictionary {subkey: (value, expiration_time)}
+          2) if local storage already has a dictionary under :key:, try to add (subkey, value, exp_time) to that dictionary
+          3) if local storage associates :key: with a normal value with smaller expiration, clear :key: and perform (1)
+          4) finally, if local storage currently associates :key: with a normal value with larger expiration, do nothing
         :param in_cache: a list of booleans, True = store i-th key in cache, False = store i-th key locally
         :param in_cache: a list of booleans, True = store i-th key in cache, False = store i-th key locally
         :note: the difference between storing normally and in cache is that normal storage is guaranteed to be stored
         :note: the difference between storing normally and in cache is that normal storage is guaranteed to be stored
          until expiration time (best-effort), whereas cached storage can be evicted early due to limited cache size
          until expiration time (best-effort), whereas cached storage can be evicted early due to limited cache size
-
         :return: list of [True / False] True = stored, False = failed (found newer value or no response)
         :return: list of [True / False] True = stored, False = failed (found newer value or no response)
-         if peer did not respond (e.g. due to timeout or congestion), returns None
+                 if peer did not respond (e.g. due to timeout or congestion), returns None
         """
         """
         if isinstance(expiration_time, DHTExpiration):
         if isinstance(expiration_time, DHTExpiration):
             expiration_time = [expiration_time] * len(keys)
             expiration_time = [expiration_time] * len(keys)
+        if subkeys is None or isinstance(subkeys, Subkey):
+            subkeys = [subkeys] * len(keys)
+
         in_cache = in_cache if in_cache is not None else [False] * len(keys)  # default value (None)
         in_cache = in_cache if in_cache is not None else [False] * len(keys)  # default value (None)
         in_cache = [in_cache] * len(keys) if isinstance(in_cache, bool) else in_cache  # single bool
         in_cache = [in_cache] * len(keys) if isinstance(in_cache, bool) else in_cache  # single bool
-        keys, values, expiration_time, in_cache = map(list, [keys, values, expiration_time, in_cache])
+        keys, subkeys, values, expiration_time, in_cache = map(list, [keys, subkeys, values, expiration_time, in_cache])
+        for i in range(len(keys)):
+            if subkeys[i] is None:  # add default sub-key if not specified
+                subkeys[i] = IS_REGULAR_VALUE if not isinstance(values[i], DictionaryDHTValue) else IS_DICTIONARY
+            if isinstance(values[i], DictionaryDHTValue):
+                assert subkeys[i] == IS_DICTIONARY, "Please do not specify subkey when storing an entire dictionary"
+                values[i] = self.serializer.dumps(values[i])
+
         assert len(keys) == len(values) == len(expiration_time) == len(in_cache), "Data is not aligned"
         assert len(keys) == len(values) == len(expiration_time) == len(in_cache), "Data is not aligned"
-        store_request = dht_pb2.StoreRequest(keys=list(map(DHTID.to_bytes, keys)), values=values,
+        store_request = dht_pb2.StoreRequest(keys=list(map(DHTID.to_bytes, keys)), subkeys=subkeys, values=values,
                                              expiration_time=expiration_time, in_cache=in_cache, peer=self.node_info)
                                              expiration_time=expiration_time, in_cache=in_cache, peer=self.node_info)
         try:
         try:
             async with self.rpc_semaphore:
             async with self.rpc_semaphore:
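
The tests further down exercise this path; as a usage-level sketch (not part of the patch, function name made up), storing two sub-keys under one DHT key with the new call_store signature looks roughly like this, assuming `protocol` is a running DHTProtocol and `peer` is a reachable endpoint string such as '127.0.0.1:31337':

from hivemind.dht.routing import DHTID, get_dht_time
from hivemind.utils import MSGPackSerializer

async def store_two_subkeys(protocol, peer):
    key = DHTID.generate(source='my_dictionary_key')
    expiration = get_dht_time() + 60
    # each call adds or updates one sub-key of the dictionary stored under `key`
    await protocol.call_store(peer, keys=[key], values=[MSGPackSerializer.dumps('value_a')],
                              expiration_time=[expiration], subkeys=['subkey_a'])
    await protocol.call_store(peer, keys=[key], values=[MSGPackSerializer.dumps('value_b')],
                              expiration_time=[expiration + 10], subkeys=['subkey_b'])
    # a later call_find(peer, [key]) returns a DictionaryDHTValue with both sub-keys as the value for `key`
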
@@ -145,7 +163,7 @@ class DHTProtocol(dht_grpc.DHTServicer):
         except grpc.experimental.aio.AioRpcError as error:
         except grpc.experimental.aio.AioRpcError as error:
             logger.warning(f"DHTProtocol failed to store at {peer}: {error.code()}")
             logger.warning(f"DHTProtocol failed to store at {peer}: {error.code()}")
             asyncio.create_task(self.update_routing_table(self.routing_table.get(endpoint=peer), peer, responded=False))
             asyncio.create_task(self.update_routing_table(self.routing_table.get(endpoint=peer), peer, responded=False))
-            return [False] * len(keys)
+            return None
 
 
     async def rpc_store(self, request: dht_pb2.StoreRequest, context: grpc.ServicerContext) -> dht_pb2.StoreResponse:
     async def rpc_store(self, request: dht_pb2.StoreRequest, context: grpc.ServicerContext) -> dht_pb2.StoreResponse:
         """ Some node wants us to store this (key, value) pair """
         """ Some node wants us to store this (key, value) pair """
@@ -153,10 +171,19 @@ class DHTProtocol(dht_grpc.DHTServicer):
             asyncio.create_task(self.rpc_ping(request.peer, context))
             asyncio.create_task(self.rpc_ping(request.peer, context))
         assert len(request.keys) == len(request.values) == len(request.expiration_time) == len(request.in_cache)
         assert len(request.keys) == len(request.values) == len(request.expiration_time) == len(request.in_cache)
         response = dht_pb2.StoreResponse(store_ok=[], peer=self.node_info)
         response = dht_pb2.StoreResponse(store_ok=[], peer=self.node_info)
-        for key_bytes, value_bytes, expiration_time, in_cache in zip(
-                request.keys, request.values, request.expiration_time, request.in_cache):
-            local_memory = self.cache if in_cache else self.storage
-            response.store_ok.append(local_memory.store(DHTID.from_bytes(key_bytes), value_bytes, expiration_time))
+        keys = map(DHTID.from_bytes, request.keys)
+        for key_id, subkey, value_bytes, expiration_time, in_cache in zip(
+                keys, request.subkeys, request.values, request.expiration_time, request.in_cache):
+            storage = self.cache if in_cache else self.storage
+            if subkey == IS_REGULAR_VALUE:  # store normal value without subkeys
+                response.store_ok.append(storage.store(key_id, value_bytes, expiration_time))
+            elif subkey == IS_DICTIONARY:   # store an entire dictionary with pre-existing subkeys
+                value_dictionary = self.serializer.loads(value_bytes)
+                assert isinstance(value_dictionary, DictionaryDHTValue)
+                response.store_ok.append(all(storage.store_subkey(key_id, subkey, subvalue, subkey_expiration)
+                                             for subkey, subvalue, subkey_expiration in value_dictionary.items()))
+            else:  # add new entry into an existing dictionary-like value or create a new dictionary with one sub-key
+                response.store_ok.append(storage.store_subkey(key_id, subkey, value_bytes, expiration_time))
         return response
         return response
 
 
     async def call_find(self, peer: Endpoint, keys: Collection[DHTID]) -> \
     async def call_find(self, peer: Endpoint, keys: Collection[DHTID]) -> \
@@ -179,16 +206,19 @@ class DHTProtocol(dht_grpc.DHTServicer):
             if response.peer and response.peer.node_id:
             if response.peer and response.peer.node_id:
                 peer_id = DHTID.from_bytes(response.peer.node_id)
                 peer_id = DHTID.from_bytes(response.peer.node_id)
                 asyncio.create_task(self.update_routing_table(peer_id, peer, responded=True))
                 asyncio.create_task(self.update_routing_table(peer_id, peer, responded=True))
-            assert len(response.values) == len(response.expiration_time) == len(response.nearest) == len(keys), \
-                "DHTProtocol: response is not aligned with keys and/or expiration times"
-
-            output = {}  # unpack data without special NOT_FOUND_* values
-            for key, value, expiration_time, nearest in zip(
-                    keys, response.values, response.expiration_time, response.nearest):
-                value = value if value != _NOT_FOUND_VALUE else None
-                expiration_time = expiration_time if expiration_time != _NOT_FOUND_EXPIRATION else None
-                nearest = dict(zip(map(DHTID.from_bytes, nearest.node_ids), nearest.endpoints))
-                output[key] = (value, expiration_time, nearest)
+            assert len(keys) == len(response.results), "DHTProtocol: response is not aligned with keys"
+
+            output = {}  # unpack data depending on its type
+            for key, result in zip(keys, response.results):
+                nearest = dict(zip(map(DHTID.from_bytes, result.nearest_node_ids), result.nearest_endpoints))
+                if result.type == dht_pb2.NOT_FOUND:
+                    output[key] = None, None, nearest
+                elif result.type == dht_pb2.FOUND_REGULAR:
+                    output[key] = result.value, result.expiration_time, nearest
+                elif result.type == dht_pb2.FOUND_DICTIONARY:
+                    output[key] = self.serializer.loads(result.value), result.expiration_time, nearest
+                else:
+                    logger.error(f"Unknown result type: {result.type}")
             return output
             return output
         except grpc.experimental.aio.AioRpcError as error:
         except grpc.experimental.aio.AioRpcError as error:
             logger.warning(f"DHTProtocol failed to find at {peer}: {error.code()}")
             logger.warning(f"DHTProtocol failed to find at {peer}: {error.code()}")
@@ -201,24 +231,27 @@ class DHTProtocol(dht_grpc.DHTServicer):
         """
         """
         if request.peer:  # if requested, add peer to the routing table
         if request.peer:  # if requested, add peer to the routing table
             asyncio.create_task(self.rpc_ping(request.peer, context))
             asyncio.create_task(self.rpc_ping(request.peer, context))
-
-        response = dht_pb2.FindResponse(values=[], expiration_time=[], nearest=[], peer=self.node_info)
-        for key_id in map(DHTID.from_bytes, request.keys):
+        response = dht_pb2.FindResponse(results=[], peer=self.node_info)
+        for i, key_id in enumerate(map(DHTID.from_bytes, request.keys)):
             maybe_value, maybe_expiration_time = self.storage.get(key_id)
             maybe_value, maybe_expiration_time = self.storage.get(key_id)
             cached_value, cached_expiration_time = self.cache.get(key_id)
             cached_value, cached_expiration_time = self.cache.get(key_id)
             if (cached_expiration_time or -float('inf')) > (maybe_expiration_time or -float('inf')):
             if (cached_expiration_time or -float('inf')) > (maybe_expiration_time or -float('inf')):
                 maybe_value, maybe_expiration_time = cached_value, cached_expiration_time
                 maybe_value, maybe_expiration_time = cached_value, cached_expiration_time
 
 
-            nearest_neighbors = self.routing_table.get_nearest_neighbors(
-                key_id, k=self.bucket_size, exclude=DHTID.from_bytes(request.peer.node_id))
-            if nearest_neighbors:
-                peer_ids, endpoints = zip(*nearest_neighbors)
-            else:
-                peer_ids, endpoints = [], []
-
-            response.values.append(maybe_value if maybe_value is not None else _NOT_FOUND_VALUE)
-            response.expiration_time.append(maybe_expiration_time if maybe_expiration_time else _NOT_FOUND_EXPIRATION)
-            response.nearest.append(dht_pb2.Peers(node_ids=list(map(DHTID.to_bytes, peer_ids)), endpoints=endpoints))
+            if maybe_expiration_time is None:  # value not found
+                item = dht_pb2.FindResult(type=dht_pb2.NOT_FOUND)
+            elif isinstance(maybe_value, DictionaryDHTValue):
+                item = dht_pb2.FindResult(type=dht_pb2.FOUND_DICTIONARY, value=self.serializer.dumps(maybe_value),
+                                          expiration_time=maybe_value.latest_expiration_time)
+            else:  # found regular value
+                item = dht_pb2.FindResult(type=dht_pb2.FOUND_REGULAR, value=maybe_value,
+                                          expiration_time=maybe_expiration_time)
+
+            for node_id, endpoint in self.routing_table.get_nearest_neighbors(
+                key_id, k=self.bucket_size, exclude=DHTID.from_bytes(request.peer.node_id)):
+                item.nearest_node_ids.append(node_id.to_bytes())
+                item.nearest_endpoints.append(endpoint)
+            response.results.append(item)
         return response
         return response
 
 
     async def update_routing_table(self, node_id: Optional[DHTID], peer_endpoint: Endpoint, responded=True):
     async def update_routing_table(self, node_id: Optional[DHTID], peer_endpoint: Endpoint, responded=True):
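
Stated on its own, the local lookup in rpc_find above follows one rule: prefer whichever of persistent storage and cache holds the later expiration time. A minimal restatement (illustration only, helper name made up):

def pick_freshest(storage_entry, cache_entry):
    # each entry is a (maybe_value, maybe_expiration_time) pair; prefer whichever expires later
    (value, expiration), (cached_value, cached_expiration) = storage_entry, cache_entry
    if (cached_expiration or -float('inf')) > (expiration or -float('inf')):
        return cached_value, cached_expiration
    return value, expiration
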
@@ -256,91 +289,3 @@ class DHTProtocol(dht_grpc.DHTServicer):
         else:  # we sent outgoing request and peer did not respond
         else:  # we sent outgoing request and peer did not respond
             if node_id is not None and node_id in self.routing_table:
             if node_id is not None and node_id in self.routing_table:
                 del self.routing_table[node_id]
                 del self.routing_table[node_id]
-
-
-_NOT_FOUND_VALUE, _NOT_FOUND_EXPIRATION = b'', -float('inf')  # internal values to represent that a value was not found
-
-
-class LocalStorage:
-    """ Local dictionary that maintains up to :maxsize: tuples of (key, value, expiration_time) """
-
-    def __init__(self, maxsize: Optional[int] = None):
-        self.cache_size = maxsize or float("inf")
-        self.data: Dict[DHTID, Tuple[BinaryDHTValue, DHTExpiration]] = dict()
-        self.expiration_heap: List[Tuple[DHTExpiration, DHTID]] = []
-        self.key_to_heap: Dict[DHTID, Tuple[DHTExpiration, DHTID]] = dict()
-        self.frozen = False  # if True, do not remove outdated elements
-
-    def _remove_outdated(self):
-        while not self.frozen and self.expiration_heap and (self.expiration_heap[0][0] < get_dht_time()
-                                                            or len(self.expiration_heap) > self.cache_size):
-            heap_entry = heapq.heappop(self.expiration_heap)
-            key = heap_entry[1]
-            if self.key_to_heap.get(key) == heap_entry:
-                del self.data[key], self.key_to_heap[key]
-
-    def store(self, key: DHTID, value: BinaryDHTValue, expiration_time: DHTExpiration) -> bool:
-        """
-        Store a (key, value) pair locally at least until expiration_time. See class docstring for details.
-        :returns: True if new value was stored, False it was rejected (current value is newer)
-        """
-        if expiration_time < get_dht_time() and not self.frozen:
-            return False
-        self.key_to_heap[key] = (expiration_time, key)
-        heapq.heappush(self.expiration_heap, (expiration_time, key))
-        if key in self.data:
-            if self.data[key][1] < expiration_time:
-                self.data[key] = (value, expiration_time)
-                return True
-            return False
-        self.data[key] = (value, expiration_time)
-        self._remove_outdated()
-        return True
-
-    def get(self, key: DHTID) -> (Optional[BinaryDHTValue], Optional[DHTExpiration]):
-        """ Get a value corresponding to a key if that (key, value) pair was previously stored here. """
-        self._remove_outdated()
-        if key in self.data:
-            return self.data[key]
-        return None, None
-
-    def items(self) -> Iterator[Tuple[DHTID, BinaryDHTValue, DHTExpiration]]:
-        """ Iterate over (key, value, expiration_time) tuples stored in this storage """
-        self._remove_outdated()
-        return ((key, value, expiration_time) for key, (value, expiration_time) in self.data.items())
-
-    def top(self) -> Optional[Tuple[DHTID, BinaryDHTValue, DHTExpiration]]:
-        """ Return the entry with earliest expiration or None if there isn't any """
-        self._remove_outdated()
-        if self.data:
-            top_entry, top_key = self.expiration_heap[0], self.expiration_heap[0][1]
-            while self.key_to_heap.get(top_key) != top_entry:
-                heapq.heappop(self.expiration_heap)  # skip leftover "ghost" entries until first real entry
-                top_entry, top_key = self.expiration_heap[0], self.expiration_heap[0][1]
-            value, expiration = self.data[top_key]
-            return top_key, value, expiration
-
-    def __contains__(self, key: DHTID):
-        self._remove_outdated()
-        return key in self.data
-
-    def __len__(self):
-        self._remove_outdated()
-        return len(self.data)
-
-    def __delitem__(self, key: DHTID):
-        if key in self.key_to_heap:
-            del self.data[key], self.key_to_heap[key]
-        # note: key may still be in self.expiration_heap, but it will not be used and eventually ._remove_outdated()
-
-    def __bool__(self):
-        return bool(self.data)
-
-    @contextmanager
-    def freeze(self):
-        """ Temporarily cease to ._remove_outdated() elements inside this context to ensure consistency """
-        prev_frozen, self.frozen = self.frozen, True
-        try:
-            yield self
-        finally:
-            self.frozen = prev_frozen

+ 1 - 1
hivemind/dht/routing.py

@@ -12,7 +12,7 @@ from typing import Tuple, Optional, List, Dict, Set, Union, Any, Sequence
 
 
 from hivemind.utils import Endpoint, PickleSerializer
 from hivemind.utils import Endpoint, PickleSerializer
 
 
-DHTKey, DHTValue, DHTExpiration, BinaryDHTID, BinaryDHTValue, = Any, Any, float, bytes, bytes  # flavour types
+DHTKey, Subkey, DHTValue, DHTExpiration, BinaryDHTID, BinaryDHTValue, = Any, str, Any, float, bytes, bytes
 get_dht_time = time.time  # time used by all dht functionality. You can replace this with any infrastructure-wide time
 get_dht_time = time.time  # time used by all dht functionality. You can replace this with any infrastructure-wide time
 
 
 
 

+ 161 - 0
hivemind/dht/storage.py

@@ -0,0 +1,161 @@
+from __future__ import annotations
+import heapq
+from contextlib import contextmanager
+from typing import Generic, Optional, Dict, Tuple, List, Iterator, TypeVar, Union, Any
+
+from hivemind.dht.routing import DHTID, DHTExpiration, get_dht_time, BinaryDHTValue, Subkey
+from hivemind.utils.serializer import MSGPackSerializer
+
+KeyType = TypeVar('KeyType')
+ValueType = TypeVar('ValueType')
+
+
+class TimedStorage(Generic[KeyType, ValueType]):
+    """ A dictionary that maintains up to :maxsize: key-value-expiration tuples until their expiration_time """
+    frozen = False  # can be set to True. If true, do not remove outdated elements
+
+    def __init__(self, maxsize: Optional[int] = None):
+        self.maxsize = maxsize or float("inf")
+        self.data: Dict[KeyType, Tuple[ValueType, DHTExpiration]] = dict()
+        self.expiration_heap: List[Tuple[DHTExpiration, KeyType]] = []
+        self.key_to_heap: Dict[KeyType, Tuple[DHTExpiration, KeyType]] = dict()
+
+    def _remove_outdated(self):
+        while not self.frozen and self.expiration_heap and (self.expiration_heap[0][0] < get_dht_time()
+                                                            or len(self.expiration_heap) > self.maxsize):
+            heap_entry = heapq.heappop(self.expiration_heap)
+            key = heap_entry[1]
+            if self.key_to_heap.get(key) == heap_entry:
+                del self.data[key], self.key_to_heap[key]
+
+    def store(self, key: KeyType, value: ValueType, expiration_time: DHTExpiration) -> bool:
+        """
+        Store a (key, value) pair locally at least until expiration_time. See class docstring for details.
+        :returns: True if new value was stored, False if it was rejected (current value is newer)
+        """
+        if expiration_time < get_dht_time() and not self.frozen:
+            return False
+        self.key_to_heap[key] = (expiration_time, key)
+        heapq.heappush(self.expiration_heap, (expiration_time, key))
+        if key in self.data:
+            if self.data[key][1] < expiration_time:
+                self.data[key] = (value, expiration_time)
+                return True
+            return False
+        self.data[key] = (value, expiration_time)
+        self._remove_outdated()
+        return True
+
+    def get(self, key: KeyType) -> (Optional[ValueType], Optional[DHTExpiration]):
+        """ Get a value corresponding to a key if that (key, value) pair was previously stored under this key. """
+        self._remove_outdated()
+        if key in self.data:
+            return self.data[key]
+        return None, None
+
+    def items(self) -> Iterator[Tuple[KeyType, ValueType, DHTExpiration]]:
+        """ Iterate over (key, value, expiration_time) tuples stored in this storage """
+        self._remove_outdated()
+        return ((key, value, expiration_time) for key, (value, expiration_time) in self.data.items())
+
+    def top(self) -> Optional[Tuple[KeyType, ValueType, DHTExpiration]]:
+        """ Return the entry with earliest expiration or None if there isn't any """
+        self._remove_outdated()
+        if self.data:
+            top_entry, top_key = self.expiration_heap[0], self.expiration_heap[0][1]
+            while self.key_to_heap.get(top_key) != top_entry:
+                heapq.heappop(self.expiration_heap)  # skip leftover "ghost" entries until first real entry
+                top_entry, top_key = self.expiration_heap[0], self.expiration_heap[0][1]
+            value, expiration = self.data[top_key]
+            return top_key, value, expiration
+
+    def __contains__(self, key: KeyType):
+        self._remove_outdated()
+        return key in self.data
+
+    def __len__(self):
+        self._remove_outdated()
+        return len(self.data)
+
+    def __delitem__(self, key: KeyType):
+        if key in self.key_to_heap:
+            del self.data[key], self.key_to_heap[key]
+        # note: key may still be in self.expiration_heap, but it will not be used and will eventually be pruned by ._remove_outdated()
+
+    def __bool__(self):
+        return bool(self.data)
+
+    def __repr__(self):
+        return f"{self.__class__.__name__}({self.data})"
+
+    @contextmanager
+    def freeze(self):
+        """ Temporarily cease to ._remove_outdated() elements inside this context to ensure consistency """
+        prev_frozen, self.frozen = self.frozen, True
+        try:
+            yield self
+        finally:
+            self.frozen = prev_frozen
+
+
+@MSGPackSerializer.ext_serializable(0x50)
+class DictionaryDHTValue(TimedStorage[Subkey, BinaryDHTValue]):
+    """ a dictionary-like DHT value type that maps sub-keys to values with individual expirations """
+    latest_expiration_time = float('-inf')
+
+    def store(self, key: KeyType, value: ValueType, expiration_time: DHTExpiration) -> bool:
+        self.latest_expiration_time = max(self.latest_expiration_time, expiration_time)
+        return super().store(key, value, expiration_time)
+
+    def packb(self) -> bytes:
+        """ custom behavior for MSGPackSerializer.dumps """
+        return MSGPackSerializer.dumps([self.maxsize, self.latest_expiration_time, list(map(list, self.items()))])
+
+    @classmethod
+    def unpackb(cls, raw: bytes) -> DictionaryDHTValue:
+        maxsize, latest_expiration_time, items = MSGPackSerializer.loads(raw)
+        with DictionaryDHTValue(maxsize).freeze() as new_dict:
+            for key, value, expiration_time in items:
+                new_dict.store(key, value, expiration_time)
+            new_dict.latest_expiration_time = latest_expiration_time
+            return new_dict
+
+
+class DHTLocalStorage(TimedStorage[DHTID, Union[BinaryDHTValue, DictionaryDHTValue]]):
+    """ A dictionary-like storage that can store binary values and/or nested dictionaries until expiration """
+    def store(self, key: DHTID, value: BinaryDHTValue, expiration_time: DHTExpiration,
+              subkey: Optional[Subkey] = None) -> bool:
+        """
+        Store a (key, value) pair locally at least until expiration_time. See class docstring for details.
+        If subkey is not None, adds a subkey-value pair to a dictionary associated with :key: (see store_subkey below)
+        :returns: True if new value was stored, False it was rejected (current value is newer)
+        """
+        if subkey is not None:  # add one sub-key
+            return self.store_subkey(key, subkey, value, expiration_time)
+        else:  # store regular key
+            return super().store(key, value, expiration_time)
+
+    def store_subkey(self, key: DHTID, subkey: Subkey, value: BinaryDHTValue, expiration_time: DHTExpiration) -> bool:
+        """
+        Save a (sub-key, value) into a dictionary associated with a given key.
+         1) if self[key] is empty, create a new dictionary and add sub-key there
+         2) if self[key] is a dictionary (DictionaryDHTValue), store {sub-key: value, expiration} to that storage
+         3) if self[key] is a normal value with smaller expiration time, overwrite it with a dictionary and add sub-key
+         4) if self[key] is a normal value with a larger expiration time, reject the new sub-key and return False
+        :returns: True if new entry was stored, False if it was rejected (current value is newer)
+        """
+        previous_value, previous_expiration_time = self.get(key)
+        if isinstance(previous_value, DictionaryDHTValue):  # already a dictionary, just add new subkey
+            if expiration_time > previous_value.latest_expiration_time:
+                super().store(key, previous_value, expiration_time)  # refresh expiration time
+            return previous_value.store(subkey, value, expiration_time)
+        elif expiration_time > (previous_expiration_time or float('-inf')):  # create new dictionary, add subkey
+            new_storage = DictionaryDHTValue()
+            new_storage.store(subkey, value, expiration_time)
+            return super().store(key, new_storage, new_storage.latest_expiration_time)
+        else:
+            return False
+
+
+class CacheRefreshQueue(TimedStorage[DHTID, DHTExpiration]):
+    """ a queue of keys scheduled for refresh in future, used in DHTNode """
+    frozen = True

+ 18 - 12
hivemind/proto/dht.proto

@@ -24,10 +24,11 @@ message NodeInfo {
 message StoreRequest {
 message StoreRequest {
   // three lists of the same length representing dht keys, dht values and expiration
   // three lists of the same length representing dht keys, dht values and expiration
   repeated bytes keys = 1;             // keys in the form of DHTID.generate(raw_key).to_bytes()
   repeated bytes keys = 1;             // keys in the form of DHTID.generate(raw_key).to_bytes()
-  repeated bytes values = 2;           // binary-encoded value for i-th key
-  repeated double expiration_time = 3; // expirations for i-th key (type = DHTExpiration)
-  repeated bool in_cache = 4;          // if in_cache[i], store i-th key in cache, else store normally
-  NodeInfo peer = 5;                   // (optional) sender's own node info, same behavior as in DHT.rpc_ping
+  repeated string subkeys = 2;         // [optional] subkeys for DictionaryDHTValue type, empty string means no subkey
+  repeated bytes values = 3;           // binary-encoded value for i-th key
+  repeated double expiration_time = 4; // expirations for i-th key (type = DHTExpiration)
+  repeated bool in_cache = 5;          // if in_cache[i], store i-th key in cache, else store normally
+  NodeInfo peer = 6;                   // (optional) sender's own node info, same behavior as in DHT.rpc_ping
 }
 }
 
 
 message StoreResponse {
 message StoreResponse {
@@ -40,16 +41,21 @@ message FindRequest {
   NodeInfo peer = 2;                   // optional, same behavior as in DHT.ping
   NodeInfo peer = 2;                   // optional, same behavior as in DHT.ping
 }
 }
 
 
-message Peers {
-  // two aligned arrays: DHTIDs and Endpoints, i-th endpoint corresponds to peer with i-th node id
-  repeated bytes node_ids = 1;         // DHTID serialized with node_id.to_bytes()
-  repeated string endpoints = 2;       // e.g. 123.123.123.123:1337 or [2a21:6с8:b192:2105]:8888
+enum ResultType {NOT_FOUND = 0; FOUND_REGULAR = 1; FOUND_DICTIONARY = 2;}
+
+message FindResult {
+  ResultType type = 1;                 // NOT_FOUND | FOUND_REGULAR | FOUND_DICTIONARY
+  bytes value = 2;                     // n/a  | serialized value | serialized DictionaryDHTValue with serialized fields
+  double expiration_time = 3;          // n/a  | expiration time  | DictionaryDHTValue.latest_expiration_time
+
+  // two aligned arrays: DHTIDs and Endpoints for nearest peers (sorted by XOR distance)
+  repeated bytes nearest_node_ids = 4;      // DHTIDs serialized with node_id.to_bytes()
+  repeated string nearest_endpoints = 5;    // e.g. 123.123.123.123:1337 or [2a21:6c8:b192:2105]:8888
 }
 }
 
 
+
 message FindResponse {
 message FindResponse {
-  repeated bytes values = 1;           // value for i-th key, b'' means not found locally
-  repeated double expiration_time = 2; // expiration time for i-th value, only valid value is found
-  repeated Peers nearest = 3;          // peers ordered from nearest to farthest based on distance to i-th key
-  NodeInfo peer = 4;                   // respondent's node id, for you to update routing table
+  repeated FindResult results = 1;       // for each item, return value/expiration (if found) and nearest peers
+  NodeInfo peer = 2;                   // respondent's node id, for you to update routing table
 }
 }
 
 

+ 0 - 1
hivemind/server/checkpoint_saver.py

@@ -1,5 +1,4 @@
 import threading
 import threading
-import time
 from datetime import datetime
 from datetime import datetime
 from pathlib import Path
 from pathlib import Path
 from shutil import copytree
 from shutil import copytree

+ 43 - 7
hivemind/utils/serializer.py

@@ -1,9 +1,14 @@
 """ A unified interface for several common serialization methods """
 """ A unified interface for several common serialization methods """
 import pickle
 import pickle
 from io import BytesIO
 from io import BytesIO
+from typing import Dict, Any
 
 
 import torch
 import torch
-import umsgpack
+import msgpack
+from hivemind.utils.logging import get_logger
+
+logger = get_logger(__name__)
+
 
 
 class SerializerBase:
 class SerializerBase:
     @staticmethod
     @staticmethod
@@ -38,10 +43,41 @@ class PytorchSerializer(SerializerBase):
 
 
 
 
 class MSGPackSerializer(SerializerBase):
 class MSGPackSerializer(SerializerBase):
-    @staticmethod
-    def dumps(obj: object) -> bytes:
-        return umsgpack.dumps(obj, use_bin_type=False, strict_types=True)
+    _ExtTypes: Dict[Any, int] = {}
+    _ExtTypeCodes: Dict[int, Any] = {}
+
+    @classmethod
+    def ext_serializable(cls, type_code: int):
+        assert isinstance(type_code, int), "Please specify a (unique) int type code"
+
+        def wrap(wrapped_type: type):
+            assert callable(getattr(wrapped_type, 'packb', None)) and callable(getattr(wrapped_type, 'unpackb', None)),\
+                f"Every ext_type must have 2 methods: packb(self) -> bytes and classmethod unpackb(cls, bytes)"
+            if type_code in cls._ExtTypeCodes:
+                logger.warning(f"{cls.__name__}: type {type_code} is already registered, overwriting.")
+            cls._ExtTypeCodes[type_code], cls._ExtTypes[wrapped_type] = wrapped_type, type_code
+            return wrapped_type
+        return wrap
+
+    @classmethod
+    def _encode_ext_types(cls, obj):
+        type_code = cls._ExtTypes.get(type(obj))
+        if type_code is not None:
+            return msgpack.ExtType(type_code, obj.packb())
+        return obj
+
+    @classmethod
+    def _decode_ext_types(cls, type_code: int, data: bytes):
+        if type_code in cls._ExtTypeCodes:
+            return cls._ExtTypeCodes[type_code].unpackb(data)
+        logger.warning(f"Unknown ExtType code: {type_code}, leaving it as is.")
+        return data
+
+    @classmethod
+    def dumps(cls, obj: object) -> bytes:
+        return msgpack.dumps(obj, use_bin_type=True, default=cls._encode_ext_types, strict_types=True)
+
+    @classmethod
+    def loads(cls, buf: bytes) -> object:
+        return msgpack.loads(buf, ext_hook=cls._decode_ext_types, raw=False)
 
 
-    @staticmethod
-    def loads(buf: bytes) -> object:
-        return umsgpack.loads(buf, raw=False)

+ 1 - 1
requirements.txt

@@ -2,7 +2,7 @@ PyYAML
 torch>=1.3.0
 torch>=1.3.0
 numpy>=1.17
 numpy>=1.17
 prefetch_generator>=1.0.1
 prefetch_generator>=1.0.1
-umsgpack
+msgpack>=0.5.6
 sortedcontainers
 sortedcontainers
 uvloop>=0.14.0
 uvloop>=0.14.0
 grpcio>=1.31
 grpcio>=1.31

+ 1 - 1
tests/test_dht_experts.py

@@ -6,7 +6,7 @@ import hivemind
 from hivemind import LOCALHOST
 from hivemind import LOCALHOST
 
 
 
 
-def test_hivemind_dht():
+def test_store_get_experts():
     peers = [hivemind.DHT(start=True)]
     peers = [hivemind.DHT(start=True)]
     for i in range(10):
     for i in range(10):
         neighbors_i = [f'{LOCALHOST}:{node.port}' for node in random.sample(peers, min(3, len(peers)))]
         neighbors_i = [f'{LOCALHOST}:{node.port}' for node in random.sample(peers, min(3, len(peers)))]

+ 91 - 8
tests/test_dht_node.py

@@ -11,6 +11,7 @@ from typing import List, Dict
 from hivemind import get_dht_time
 from hivemind import get_dht_time
 from hivemind.dht.node import DHTID, Endpoint, DHTNode, LOCALHOST, DHTProtocol
 from hivemind.dht.node import DHTID, Endpoint, DHTNode, LOCALHOST, DHTProtocol
 from hivemind.dht.protocol import DHTProtocol
 from hivemind.dht.protocol import DHTProtocol
+from hivemind.dht.storage import DictionaryDHTValue
 
 
 
 
 def run_protocol_listener(port: int, dhtid: DHTID, started: mp.synchronize.Event, ping: Optional[Endpoint] = None):
 def run_protocol_listener(port: int, dhtid: DHTID, started: mp.synchronize.Event, ping: Optional[Endpoint] = None):
@@ -85,6 +86,24 @@ def test_dht_protocol():
             dummy_port = hivemind.find_open_port()
             dummy_port = hivemind.find_open_port()
             assert loop.run_until_complete(protocol.call_find(f"{LOCALHOST}:{dummy_port}", [key])) is None
             assert loop.run_until_complete(protocol.call_find(f"{LOCALHOST}:{dummy_port}", [key])) is None
 
 
+            # store/get a dictionary with sub-keys
+            nested_key, subkey1, subkey2 = DHTID.generate(), 'foo', 'bar'
+            value1, value2 = [random.random(), {'ololo': 'pyshpysh'}], 'abacaba'
+            assert loop.run_until_complete(protocol.call_store(
+                f'{LOCALHOST}:{peer1_port}', keys=[nested_key], values=[hivemind.MSGPackSerializer.dumps(value1)],
+                expiration_time=[expiration], subkeys=[subkey1])
+            )
+            assert loop.run_until_complete(protocol.call_store(
+                f'{LOCALHOST}:{peer1_port}', keys=[nested_key], values=[hivemind.MSGPackSerializer.dumps(value2)],
+                expiration_time=[expiration + 5], subkeys=[subkey2])
+            )
+            recv_dict, recv_expiration, nodes_found = loop.run_until_complete(
+                protocol.call_find(f'{LOCALHOST}:{peer1_port}', [nested_key]))[nested_key]
+            assert isinstance(recv_dict, DictionaryDHTValue)
+            assert len(recv_dict.data) == 2 and recv_expiration == expiration + 5
+            assert recv_dict.data[subkey1] == (protocol.serializer.dumps(value1), expiration)
+            assert recv_dict.data[subkey2] == (protocol.serializer.dumps(value2), expiration + 5)
+
             if listen:
             if listen:
                 loop.run_until_complete(protocol.shutdown())
                 loop.run_until_complete(protocol.shutdown())
             print("DHTProtocol test finished successfully!")
             print("DHTProtocol test finished successfully!")
@@ -172,7 +191,8 @@ def test_dht_node():
         # note: we run everything in a separate process to re-initialize all global states from scratch
         # note: we run everything in a separate process to re-initialize all global states from scratch
         # this helps us avoid undesirable side-effects when running multiple tests in sequence
         # this helps us avoid undesirable side-effects when running multiple tests in sequence
         loop = asyncio.get_event_loop()
         loop = asyncio.get_event_loop()
-        me = loop.run_until_complete(DHTNode.create(initial_peers=random.sample(dht.keys(), 5), parallel_rpc=10))
+        me = loop.run_until_complete(DHTNode.create(initial_peers=random.sample(dht.keys(), 5), parallel_rpc=10,
+                                                    cache_refresh_before_expiry=False))
 
 
         # test 1: find self
         # test 1: find self
         nearest = loop.run_until_complete(me.find_nearest_nodes([me.node_id], k_nearest=1))[me.node_id]
         nearest = loop.run_until_complete(me.find_nearest_nodes([me.node_id], k_nearest=1))[me.node_id]
@@ -229,19 +249,24 @@ def test_dht_node():
         assert len(set.difference(set(nearest.keys()), set(all_node_ids) | {me.node_id})) == 0
         assert len(set.difference(set(nearest.keys()), set(all_node_ids) | {me.node_id})) == 0
 
 
         # test 5: node without peers
         # test 5: node without peers
-        other_node = loop.run_until_complete(DHTNode.create())
-        nearest = loop.run_until_complete(other_node.find_nearest_nodes([dummy]))[dummy]
-        assert len(nearest) == 1 and nearest[other_node.node_id] == f"{LOCALHOST}:{other_node.port}"
-        nearest = loop.run_until_complete(other_node.find_nearest_nodes([dummy], exclude_self=True))[dummy]
+        detached_node = loop.run_until_complete(DHTNode.create())
+        nearest = loop.run_until_complete(detached_node.find_nearest_nodes([dummy]))[dummy]
+        assert len(nearest) == 1 and nearest[detached_node.node_id] == f"{LOCALHOST}:{detached_node.port}"
+        nearest = loop.run_until_complete(detached_node.find_nearest_nodes([dummy], exclude_self=True))[dummy]
         assert len(nearest) == 0
         assert len(nearest) == 0
 
 
         # test 6 store and get value
         # test 6 store and get value
         true_time = get_dht_time() + 1200
         true_time = get_dht_time() + 1200
         assert loop.run_until_complete(me.store("mykey", ["Value", 10], true_time))
         assert loop.run_until_complete(me.store("mykey", ["Value", 10], true_time))
-        for node in [me, other_node]:
-            val, expiration_time = loop.run_until_complete(me.get("mykey"))
-            assert expiration_time == true_time, "Wrong time"
+        that_guy = loop.run_until_complete(DHTNode.create(initial_peers=random.sample(dht.keys(), 3), parallel_rpc=10,
+                                                          cache_refresh_before_expiry=False, cache_locally=False))
+
+        for node in [me, that_guy]:
+            val, expiration_time = loop.run_until_complete(node.get("mykey"))
             assert val == ["Value", 10], "Wrong value"
             assert val == ["Value", 10], "Wrong value"
+            assert expiration_time == true_time, f"Wrong time"
+
+        assert loop.run_until_complete(detached_node.get("mykey")) == (None, None)
 
 
         # test 7: bulk store and bulk get
         # test 7: bulk store and bulk get
         keys = 'foo', 'bar', 'baz', 'zzz'
         keys = 'foo', 'bar', 'baz', 'zzz'
@@ -252,6 +277,31 @@ def test_dht_node():
         for key, value in zip(keys, values):
         for key, value in zip(keys, values):
             assert key in response and response[key][0] == value
             assert key in response and response[key][0] == value
 
 
+        # test 8: store dictionaries as values (with sub-keys)
+        upper_key, subkey1, subkey2, subkey3 = 'ololo', 'k1', 'k2', 'k3'
+        now = get_dht_time()
+        assert loop.run_until_complete(me.store(upper_key, subkey=subkey1, value=123, expiration_time=now + 10))
+        assert loop.run_until_complete(me.store(upper_key, subkey=subkey2, value=456, expiration_time=now + 20))
+        for node in [that_guy, me]:
+            value, time = loop.run_until_complete(node.get(upper_key))
+            assert isinstance(value, dict) and time == now + 20
+            assert value[subkey1] == (123, now + 10)
+            assert value[subkey2] == (456, now + 20)
+            assert len(value) == 2
+
+        assert not loop.run_until_complete(me.store(upper_key, subkey=subkey2, value=345, expiration_time=now + 10))
+        assert loop.run_until_complete(me.store(upper_key, subkey=subkey2, value=567, expiration_time=now + 30))
+        assert loop.run_until_complete(me.store(upper_key, subkey=subkey3, value=890, expiration_time=now + 50))
+        loop.run_until_complete(asyncio.sleep(0.1))  # wait for cache to refresh
+
+        for node in [that_guy, me]:
+            value, time = loop.run_until_complete(node.get(upper_key))
+            assert isinstance(value, dict) and time == now + 50, (value, time)
+            assert value[subkey1] == (123, now + 10)
+            assert value[subkey2] == (567, now + 30)
+            assert value[subkey3] == (890, now + 50)
+            assert len(value) == 3
+
         test_success.set()
         test_success.set()
 
 
     tester = mp.Process(target=_tester, daemon=True)
     tester = mp.Process(target=_tester, daemon=True)
@@ -262,6 +312,39 @@ def test_dht_node():
         proc.terminate()
         proc.terminate()
 
 
 
 
+def test_dhtnode_replicas():
+    dht_size = 20
+    initial_peers = 3
+    num_replicas = random.randint(1, 20)
+    test_success = mp.Event()
+
+    async def _tester():
+        peers = []
+        for i in range(dht_size):
+            neighbors_i = [f'{LOCALHOST}:{node.port}' for node in random.sample(peers, min(initial_peers, len(peers)))]
+            peers.append(await DHTNode.create(initial_peers=neighbors_i, num_replicas=num_replicas))
+
+        you = random.choice(peers)
+        assert await you.store('key1', 'foo', get_dht_time() + 999)
+
+        actual_key1_replicas = sum(len(peer.protocol.storage) for peer in peers)
+        assert num_replicas == actual_key1_replicas
+
+        assert await you.store('key2', 'bar', get_dht_time() + 999)
+        total_size = sum(len(peer.protocol.storage) for peer in peers)
+        actual_key2_replicas = total_size - actual_key1_replicas
+        assert num_replicas == actual_key2_replicas
+
+        assert await you.store('key2', 'baz', get_dht_time() + 1000)
+        assert sum(len(peer.protocol.storage) for peer in peers) == total_size, "total size should not have changed"
+        test_success.set()
+
+    proc = mp.Process(target=lambda: asyncio.run(_tester()))
+    proc.start()
+    proc.join()
+    assert test_success.is_set()
+
+
 def test_dhtnode_caching(T=0.05):
 def test_dhtnode_caching(T=0.05):
     test_success = mp.Event()
     test_success = mp.Event()
 
 

+ 60 - 10
tests/test_dht_storage.py

@@ -1,18 +1,19 @@
 import time
 import time
 
 
-from hivemind import DHTID, get_dht_time
-from hivemind.dht.protocol import LocalStorage
+from hivemind.dht.routing import get_dht_time
+from hivemind.dht.storage import DHTLocalStorage, DHTID, DictionaryDHTValue
+from hivemind.utils.serializer import MSGPackSerializer
 
 
 
 
 def test_store():
 def test_store():
-    d = LocalStorage()
+    d = DHTLocalStorage()
     d.store(DHTID.generate("key"), b"val", get_dht_time() + 0.5)
     d.store(DHTID.generate("key"), b"val", get_dht_time() + 0.5)
     assert d.get(DHTID.generate("key"))[0] == b"val", "Wrong value"
     assert d.get(DHTID.generate("key"))[0] == b"val", "Wrong value"
     print("Test store passed")
     print("Test store passed")
 
 
 
 
 def test_get_expired():
 def test_get_expired():
-    d = LocalStorage()
+    d = DHTLocalStorage()
     d.store(DHTID.generate("key"), b"val", get_dht_time() + 0.1)
     d.store(DHTID.generate("key"), b"val", get_dht_time() + 0.1)
     time.sleep(0.5)
     time.sleep(0.5)
     assert d.get(DHTID.generate("key")) == (None, None), "Expired value must be deleted"
     assert d.get(DHTID.generate("key")) == (None, None), "Expired value must be deleted"
@@ -20,13 +21,13 @@ def test_get_expired():
 
 
 
 
 def test_get_empty():
 def test_get_empty():
-    d = LocalStorage()
-    assert d.get(DHTID.generate(source="key")) == (None, None), "LocalStorage returned non-existent value"
+    d = DHTLocalStorage()
+    assert d.get(DHTID.generate(source="key")) == (None, None), "DHTLocalStorage returned non-existent value"
     print("Test get expired passed")
     print("Test get expired passed")
 
 
 
 
 def test_change_expiration_time():
 def test_change_expiration_time():
-    d = LocalStorage()
+    d = DHTLocalStorage()
     d.store(DHTID.generate("key"), b"val1", get_dht_time() + 1)
     d.store(DHTID.generate("key"), b"val1", get_dht_time() + 1)
     assert d.get(DHTID.generate("key"))[0] == b"val1", "Wrong value"
     assert d.get(DHTID.generate("key"))[0] == b"val1", "Wrong value"
     d.store(DHTID.generate("key"), b"val2", get_dht_time() + 200)
     d.store(DHTID.generate("key"), b"val2", get_dht_time() + 200)
@@ -36,7 +37,7 @@ def test_change_expiration_time():
 
 
 
 
 def test_maxsize_cache():
 def test_maxsize_cache():
-    d = LocalStorage(maxsize=1)
+    d = DHTLocalStorage(maxsize=1)
     d.store(DHTID.generate("key1"), b"val1", get_dht_time() + 1)
     d.store(DHTID.generate("key1"), b"val1", get_dht_time() + 1)
     d.store(DHTID.generate("key2"), b"val2", get_dht_time() + 200)
     d.store(DHTID.generate("key2"), b"val2", get_dht_time() + 200)
     assert d.get(DHTID.generate("key2"))[0] == b"val2", "Value with bigger exp. time must be kept"
     assert d.get(DHTID.generate("key2"))[0] == b"val2", "Value with bigger exp. time must be kept"
@@ -44,7 +45,7 @@ def test_maxsize_cache():
 
 
 
 
 def test_localstorage_top():
 def test_localstorage_top():
-    d = LocalStorage(maxsize=3)
+    d = DHTLocalStorage(maxsize=3)
     d.store(DHTID.generate("key1"), b"val1", get_dht_time() + 1)
     d.store(DHTID.generate("key1"), b"val1", get_dht_time() + 1)
     d.store(DHTID.generate("key2"), b"val2", get_dht_time() + 2)
     d.store(DHTID.generate("key2"), b"val2", get_dht_time() + 2)
     d.store(DHTID.generate("key3"), b"val3", get_dht_time() + 4)
     d.store(DHTID.generate("key3"), b"val3", get_dht_time() + 4)
@@ -61,8 +62,40 @@ def test_localstorage_top():
     assert d.top()[:2] == (DHTID.generate("key3"), b"val3")
     assert d.top()[:2] == (DHTID.generate("key3"), b"val3")
 
 
 
 
+def test_localstorage_nested():
+    time = get_dht_time()
+    d1 = DHTLocalStorage()
+    d2 = DictionaryDHTValue()
+    d2.store('subkey1', b'value1', time + 2)
+    d2.store('subkey2', b'value2', time + 3)
+    d2.store('subkey3', b'value3', time + 1)
+
+    assert d2.latest_expiration_time == time + 3
+    for subkey, subvalue, subexpiration in d2.items():
+        assert d1.store_subkey(DHTID.generate('foo'), subkey, subvalue, subexpiration)
+    assert d1.store(DHTID.generate('bar'), b'456', time + 2)
+    assert d1.get(DHTID.generate('foo'))[0].data == d2.data
+    assert d1.get(DHTID.generate('foo'))[1] == d2.latest_expiration_time
+    assert d1.get(DHTID.generate('foo'))[0].get('subkey1') == (b'value1', time + 2)
+    assert len(d1.get(DHTID.generate('foo'))[0]) == 3
+    assert d1.store_subkey(DHTID.generate('foo'), 'subkey4', b'value4', time + 4)
+    assert len(d1.get(DHTID.generate('foo'))[0]) == 4
+
+    assert d1.store_subkey(DHTID.generate('bar'), 'subkeyA', b'valueA', time + 1) is False  # prev has better expiration
+    assert d1.store_subkey(DHTID.generate('bar'), 'subkeyA', b'valueA', time + 3)  # new value has better expiration
+    assert d1.store_subkey(DHTID.generate('bar'), 'subkeyB', b'valueB', time + 4)  # new value has better expiration
+    assert d1.store_subkey(DHTID.generate('bar'), 'subkeyA', b'valueA+', time + 5)  # overwrite subkeyA under key bar
+    assert all(subkey in d1.get(DHTID.generate('bar'))[0] for subkey in ('subkeyA', 'subkeyB'))
+    assert len(d1.get(DHTID.generate('bar'))[0]) == 2 and d1.get(DHTID.generate('bar'))[1] == time + 5
+
+    assert d1.store(DHTID.generate('foo'), b'nothing', time + 3.5) is False  # previous value has better expiration
+    assert d1.get(DHTID.generate('foo'))[0].get('subkey2') == (b'value2', time + 3)
+    assert d1.store(DHTID.generate('foo'), b'nothing', time + 5) is True  # new value has better expiration
+    assert d1.get(DHTID.generate('foo')) == (b'nothing', time + 5)  # value should be replaced
+
+
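Note: the nested-storage test above doubles as a usage example for the new dictionary values. A condensed sketch follows; the class and method names come from the test, while the key and subkey names are made up for illustration.

    from hivemind.dht.routing import get_dht_time
    from hivemind.dht.storage import DHTLocalStorage, DHTID, DictionaryDHTValue

    now = get_dht_time()
    storage = DHTLocalStorage()
    # each subkey keeps its own expiration; the dictionary as a whole expires with its latest subkey
    storage.store_subkey(DHTID.generate('expert.3.14'), 'worker_A', b'endpoint_A', now + 60)
    storage.store_subkey(DHTID.generate('expert.3.14'), 'worker_B', b'endpoint_B', now + 90)
    value, expiration = storage.get(DHTID.generate('expert.3.14'))
    assert isinstance(value, DictionaryDHTValue) and len(value) == 2
    assert value.get('worker_A') == (b'endpoint_A', now + 60)
    assert expiration == now + 90  # == value.latest_expiration_time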
 def test_localstorage_freeze():
 def test_localstorage_freeze():
-    d = LocalStorage(maxsize=2)
+    d = DHTLocalStorage(maxsize=2)
 
 
     with d.freeze():
     with d.freeze():
         d.store(DHTID.generate("key1"), b"val1", get_dht_time() + 0.01)
         d.store(DHTID.generate("key1"), b"val1", get_dht_time() + 0.01)
@@ -77,3 +110,20 @@ def test_localstorage_freeze():
         d.store(DHTID.generate("key3"), b"val3", get_dht_time() + 3)  # key3 will push key1 out due to maxsize
         d.store(DHTID.generate("key3"), b"val3", get_dht_time() + 3)  # key3 will push key1 out due to maxsize
         assert DHTID.generate("key1") in d
         assert DHTID.generate("key1") in d
     assert DHTID.generate("key1") not in d
     assert DHTID.generate("key1") not in d
+
+
+def test_localstorage_serialize():
+    d1 = DictionaryDHTValue()
+    d2 = DictionaryDHTValue()
+
+    now = get_dht_time()
+    d1.store('key1', b'ololo', now + 1)
+    d2.store('key2', b'pysh', now + 1)
+    d2.store('key3', b'pyshpysh', now + 2)
+
+    data = MSGPackSerializer.dumps([d1, d2, 123321])
+    assert isinstance(data, bytes)
+    new_d1, new_d2, new_value = MSGPackSerializer.loads(data)
+    assert isinstance(new_d1, DictionaryDHTValue) and isinstance(new_d2, DictionaryDHTValue) and new_value == 123321
+    assert 'key1' in new_d1 and len(new_d1) == 1
+    assert 'key1' not in new_d2 and len(new_d2) == 2 and new_d2.get('key3') == (b'pyshpysh', now + 2)
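Note: as the serialization test above shows, DictionaryDHTValue round-trips through MSGPackSerializer alongside ordinary msgpack values, which suggests it can be sent over the wire like the primitive value types. A condensed round-trip mirroring that test:

    from hivemind.dht.routing import get_dht_time
    from hivemind.dht.storage import DictionaryDHTValue
    from hivemind.utils.serializer import MSGPackSerializer

    now = get_dht_time()
    original = DictionaryDHTValue()
    original.store('subkey', b'payload', now + 10)

    data = MSGPackSerializer.dumps([original, 42])   # dictionaries can sit inside regular msgpack containers
    restored, plain_int = MSGPackSerializer.loads(data)
    assert isinstance(restored, DictionaryDHTValue) and plain_int == 42
    assert restored.get('subkey') == (b'payload', now + 10)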

+ 0 - 2
tests/test_moe.py

@@ -15,8 +15,6 @@ def test_moe():
     with background_server(expert_uids=all_expert_uids, device='cpu', expert_cls='ffn',
     with background_server(expert_uids=all_expert_uids, device='cpu', expert_cls='ffn',
                            num_handlers=1, hidden_dim=16) as (server_endpoint, dht_endpoint):
                            num_handlers=1, hidden_dim=16) as (server_endpoint, dht_endpoint):
         dht = hivemind.DHT(start=True, expiration=999, initial_peers=[dht_endpoint])
         dht = hivemind.DHT(start=True, expiration=999, initial_peers=[dht_endpoint])
-        # declare expert uids. Server *should* declare them by itself, but it takes time.
-        assert all(dht.declare_experts(all_expert_uids, endpoint=server_endpoint))
 
 
         dmoe = hivemind.RemoteMixtureOfExperts(
         dmoe = hivemind.RemoteMixtureOfExperts(
             in_features=16, grid_size=(32, 32, 32), dht=dht, k_best=3, uid_prefix='ffn')
             in_features=16, grid_size=(32, 32, 32), dht=dht, k_best=3, uid_prefix='ffn')