
tesseract -> hivemind

Max Ryabinin 5 years ago
parent commit 35289c7005

+ 2 - 2
CONTRIBUTING.md

@@ -1,7 +1,7 @@
 
 
 ### Rules for collaborating:
-Tesseract is still in the early stage of development, we expect only a handful of collaborators with individual roles.
+Hivemind is still in the early stage of development, we expect only a handful of collaborators with individual roles.
 
 1. Before you write any code, please contact us to avoid duplicate work:
    * Report bugs and propose new features via issues. We don't have templates at this point;
@@ -20,5 +20,5 @@ Tesseract is still in the early stage of development, we expect only a handful o
 
 ### Tips & tricks
 * You can find a wealth of pytorch debugging tricks at [their contributing page](https://github.com/pytorch/pytorch/blob/master/CONTRIBUTING.md).
-* Tesseract is optimized for development in pycharm CE 2019.3 or newer.
+* Hivemind is optimized for development in pycharm CE 2019.3 or newer.
   * When working on tests, please mark "tests" as sources root.

+ 1 - 1
README.md

@@ -1,4 +1,4 @@
-## Tesseract
+## Hivemind
 
 [![Build status](https://circleci.com/gh/learning-at-home/tesseract.svg?style=shield)](https://circleci.com/gh/learning-at-home/tesseract)
 [![Documentation Status](https://readthedocs.org/projects/learning-at-home/badge/?version=latest)](https://learning-at-home.readthedocs.io/en/latest/?badge=latest)

+ 8 - 8
docs/conf.py

@@ -23,8 +23,8 @@ from recommonmark.parser import CommonMarkParser
 
 # -- Project information -----------------------------------------------------
 sys.path.insert(0, '..')
-src_path = '../tesseract'
-project = 'tesseract'
+src_path = '../hivemind'
+project = 'hivemind'
 copyright = '2020, Learning@home & contributors'
 author = 'Learning@home & contributors'
 
@@ -119,7 +119,7 @@ html_static_path = ['_static']
 # -- Options for HTMLHelp output ---------------------------------------------
 
 # Output file base name for HTML help builder.
-htmlhelp_basename = 'tesseractdoc'
+htmlhelp_basename = 'hiveminddoc'
 
 
 # -- Options for LaTeX output ------------------------------------------------
@@ -146,7 +146,7 @@ latex_elements = {
 # (source start file, target name, title,
 #  author, documentclass [howto, manual, or own class]).
 latex_documents = [
-    (master_doc, 'tesseract.tex', 'tesseract Documentation',
+    (master_doc, 'hivemind.tex', 'hivemind Documentation',
      'Learning@home \\& contributors', 'manual'),
 ]
 
@@ -156,7 +156,7 @@ latex_documents = [
 # One entry per manual page. List of tuples
 # (source start file, name, description, authors, manual section).
 man_pages = [
-    (master_doc, 'tesseract', 'tesseract Documentation',
+    (master_doc, 'hivemind', 'hivemind Documentation',
      [author], 1)
 ]
 
@@ -167,8 +167,8 @@ man_pages = [
 # (source start file, target name, title, author,
 #  dir menu entry, description, category)
 texinfo_documents = [
-    (master_doc, 'tesseract', 'tesseract Documentation',
-     author, 'tesseract', 'One line description of project.',
+    (master_doc, 'hivemind', 'hivemind Documentation',
+     author, 'hivemind', 'One line description of project.',
      'Miscellaneous'),
 ]
 
@@ -240,7 +240,7 @@ def linkcode_resolve(domain, info):
     if domain != 'py' or not info['module']:
         return None
     try:
-        filename = 'tesseract/%s#L%d-L%d' % find_source()
+        filename = 'hivemind/%s#L%d-L%d' % find_source()
     except Exception:
         filename = info['module'].replace('.', '/') + '.py'
     return "https://github.com/learning-at-home/tesseract/blob/%s/%s" % (branch, filename)

+ 3 - 3
docs/index.rst

@@ -1,7 +1,7 @@
-``learning@home::tesseract``
+``learning@home::hivemind``
 ====================================
 
-Tesseract lets you train huge neural networks on computers provided by volunteers. Powered by pytorch.
+Hivemind lets you train huge neural networks on computers provided by volunteers. Powered by pytorch.
 
 .. image:: _static/bug.gif
 
@@ -28,4 +28,4 @@ Indices and tables
 * :ref:`modindex`
 * :ref:`search`
 
-.. _GitHub: https://github.com/learning-at-home/tesseract
+.. _GitHub: https://github.com/learning-at-home/hivemind

+ 3 - 3
docs/modules/client.rst

@@ -1,9 +1,9 @@
-``tesseract.client``
+``hivemind.client``
 ====================
 
-.. automodule:: tesseract.client
+.. automodule:: hivemind.client
 
-.. currentmodule:: tesseract.client
+.. currentmodule:: hivemind.client
 
 .. raw:: html
 

+ 6 - 6
docs/modules/server.rst

@@ -1,17 +1,17 @@
-``tesseract.server & runtime``
+``hivemind.server & runtime``
 ========================================
 
-.. automodule:: tesseract.server
+.. automodule:: hivemind.server
 
-.. currentmodule:: tesseract.server
+.. currentmodule:: hivemind.server
 
-.. autoclass:: TesseractServer
+.. autoclass:: Server
    :members:
    :member-order: bysource
 
-.. currentmodule:: tesseract.runtime
+.. currentmodule:: hivemind.runtime
 
-.. autoclass:: TesseractRuntime
+.. autoclass:: Runtime
     :members:
     :member-order: bysource
 

+ 9 - 9
docs/user/quickstart.md

@@ -1,6 +1,6 @@
 # Quick start [nothing here yet]
 
-This will eventually become a tutorial on how to host a tesseract node or connect to an existing node.
+This will eventually become a tutorial on how to host a hivemind node or connect to an existing node.
 
 ![img](https://media.giphy.com/media/3oz8xtBx06mcZWoNJm/giphy.gif)
 
@@ -16,30 +16,30 @@ This will eventually become a tutorial on how to host a tesseract node or connec
 
 ## How do I run it?
 
-Currently, there is no way to do it easily. There are some tests (you can check [`./tests/benchmark_throughput.py`](https://github.com/learning-at-home/tesseract/blob/master/tests/benchmark_throughput.py)
+Currently, there is no way to do it easily. There are some tests (you can check [`./tests/benchmark_throughput.py`](https://github.com/learning-at-home/hivemind/blob/master/tests/benchmark_throughput.py)
  or look into CI logs) and we want to expand them. If you want to
 do something complex with it, please contact us by opening an issue (less preferred: [telegram](https://t.me/justheuristic)).
 
-## `tesseract` quick tour
+## `hivemind` quick tour
 
 **Trainer process:**
 
-- **`RemoteExpert`**(`tesseract/client/remote_expert.py`) behaves like a pytorch
+- **`RemoteExpert`**(`hivemind/client/remote_expert.py`) behaves like a pytorch
   module with autograd support but actually sends request to a remote runtime.
-- **`RemoteMixtureOfExperts`**(`tesseract/client/remote_moe.py`) finds best experts
+- **`RemoteMixtureOfExperts`**(`hivemind/client/remote_moe.py`) finds best experts
   for a given input and either returns them as `RemoteExpert` or applies them
   right away.
 
 **Runtime process:**
 
-- **`TesseractRuntime`** (`tesseract/runtime/__init__.py`) aggregates batches
+- **`Runtime`** (`hivemind/runtime/__init__.py`) aggregates batches
   and performs inference/training of experts according to their priority.
-- **`TesseractServer`** (`tesseract/server/__init__.py`) wraps runtime and
+- **`Server`** (`hivemind/server/__init__.py`) wraps runtime and
   periodically uploads experts into `DHTNode`.
 
 **DHT:**
 
-- **`DHTNode`**(`tesseract/dht/__init__.py`) is a node of
+- **`DHTNode`**(`hivemind/dht/__init__.py`) is a node of
   Kademlia-based DHT that stores metadata used by trainer and runtime.
 
 ## Limitations
@@ -52,6 +52,6 @@ do something complex with it, please contact us by opening an issue (less prefer
 
 **Runtime**:
 * You can achieve 4x less network load by passing quantized uint8 activations across experts.
-    Implement your own quantization or wait for tesseract v0.8.
+    Implement your own quantization or wait for hivemind v0.8.
 * Currently runtime can form batches that exceed maximal batch_size by task_size - 1. 
     We will fix that in the nearest patch.
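
Editorial note: the quick tour above names the renamed entry points. As a rough end-to-end illustration, here is a minimal sketch of how they fit together, based only on how `tests/benchmark_throughput.py` in this commit uses the API; the single linear expert and the hidden size 1024 are illustrative, not part of the diff.

```python
# Hedged sketch: API usage mirrors tests/benchmark_throughput.py in this commit.
import torch
import hivemind

expert = torch.jit.script(torch.nn.Linear(1024, 1024))  # illustrative expert module
backend = hivemind.ExpertBackend(
    name='expert.0', expert=expert, opt=torch.optim.Adam(expert.parameters()),
    args_schema=(hivemind.BatchTensorProto(1024),),
    outputs_schema=hivemind.BatchTensorProto(1024),
    max_batch_size=16384)

# dht=None: the server is not announced on the DHT but can still be reached directly
server = hivemind.Server(None, {'expert.0': backend},
                         port=hivemind.find_open_port(),
                         conn_handler_processes=1, device='cpu')
server.run_in_background(await_ready=True)

remote = hivemind.RemoteExpert('expert.0', port=server.port)  # trainer-side handle
output = remote(torch.randn(4, 1024))                         # request served by Runtime
server.shutdown()
```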

+ 0 - 0
tesseract/__init__.py → hivemind/__init__.py


+ 0 - 0
tesseract/client/__init__.py → hivemind/client/__init__.py


+ 2 - 2
tesseract/client/expert.py → hivemind/client/expert.py

@@ -16,8 +16,8 @@ class RemoteExpert(nn.Module):
     Sending wrong input shapes can cause RemoteExpert to freeze indefinitely due to error in runtime.
 
     :param uid: unique expert identifier
-    :param host: hostname where TesseractServer operates
-    :param port: port to which TesseractServer listens
+    :param host: hostname where Server operates
+    :param port: port to which Server listens
     """
 
     def __init__(self, uid, host='127.0.0.1', port=8080):
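
For context on the docstring above: the trainer-side handle is used roughly as below, a minimal sketch that assumes a server is already serving an expert named `expert.0` on the given host and port (as in `tests/benchmark_throughput.py`); the input size 1024 is illustrative. Note the warning above that mismatched input shapes can freeze the call.

```python
# Hedged sketch: assumes a running hivemind server hosting 'expert.0' on localhost:8080.
import torch
import hivemind

expert = hivemind.RemoteExpert(uid='expert.0', host='127.0.0.1', port=8080)
output = expert(torch.randn(16, 1024))  # forward request is sent to the remote runtime
output.sum().backward()                 # backward is likewise dispatched to the remote expert
```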

+ 1 - 1
tesseract/client/moe.py → hivemind/client/moe.py

@@ -23,7 +23,7 @@ class RemoteMixtureOfExperts(nn.Module):
      the missing experts
 
     :param in_features: common input size for experts and gating function
-    :param grid_size: tesseract dimensions that form expert uid (see below)
+    :param grid_size: hivemind dimensions that form expert uid (see below)
     :param uid_prefix: common prefix for all expert uids
      expert uid follows the pattern {uid_prefix}.{0...grid_size[0]}.{0...grid_size[1]}...{0...grid_size[-1]}
     :param dht: DHTNode where the experts reside
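
The `grid_size`/`uid_prefix` parameters described above map onto the constructor as exercised in `tests/test_moe.py` in this commit; the sketch below uses illustrative grid dimensions and feature size.

```python
# Hedged sketch following tests/test_moe.py; parameter values are illustrative.
import hivemind

dht = hivemind.DHTNode(port=hivemind.find_open_port(), start=True)
moe = hivemind.client.moe.RemoteMixtureOfExperts(
    dht=dht, in_features=1024, grid_size=[4, 4], k_best=4, k_min=1,
    timeout_after_k_min=1, uid_prefix='expert')
# experts are addressed as expert.{0..3}.{0..3}; calling moe(inputs) requires
# matching experts to actually be hosted and announced on this DHT.
dht.shutdown()
```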

+ 3 - 3
tesseract/dht/__init__.py → hivemind/dht/__init__.py

@@ -6,8 +6,8 @@ from typing import Tuple, List, Optional
 
 from kademlia.network import Server
 
-from tesseract.client import RemoteExpert
-from tesseract.utils import run_forever, SharedFuture, PickleSerializer
+from hivemind.client import RemoteExpert
+from hivemind.utils import run_forever, SharedFuture, PickleSerializer
 
 
 class DHTNode(mp.Process):
@@ -44,7 +44,7 @@ class DHTNode(mp.Process):
         """
         self.start()
         if await_ready and not self.ready.wait(timeout=timeout):
-            raise TimeoutError("TesseractServer didn't notify .ready in {timeout} seconds")
+            raise TimeoutError("Server didn't notify .ready in {timeout} seconds")
 
     def shutdown(self) -> None:
         """ Shuts down the dht process """

+ 3 - 3
tesseract/runtime/__init__.py → hivemind/runtime/__init__.py

@@ -12,15 +12,15 @@ from .expert_backend import ExpertBackend
 from .task_pool import TaskPool, TaskPoolBase
 
 
-class TesseractRuntime(threading.Thread):
+class Runtime(threading.Thread):
     """
     A group of processes that processes incoming requests for multiple experts on a shared device.
-    TesseractRuntime is usually created and managed by TesseractServer, humans need not apply.
+    Runtime is usually created and managed by Server, humans need not apply.
 
     For debugging, you can start runtime manually with .start() or .run()
 
     >>> expert_backends = {'expert_name': ExpertBackend(**kwargs)}
-    >>> runtime = TesseractRuntime(expert_backends)
+    >>> runtime = Runtime(expert_backends)
     >>> runtime.start()  # start runtime in background thread. To start in current thread, use runtime.run()
     >>> runtime.ready.wait()  # await for runtime to load all experts on device and create request pools
     >>> future = runtime.expert_backends['expert_name'].forward_pool.submit_task(*expert_inputs)

+ 5 - 5
tesseract/runtime/expert_backend.py → hivemind/runtime/expert_backend.py

@@ -9,7 +9,7 @@ from ..utils import nested_flatten, nested_pack, nested_compare, BatchTensorProt
 
 class ExpertBackend(nn.Module):
     """
-    ExpertBackend is a wrapper around torch module that allows it to run tasks asynchronously with TesseractRuntime
+    ExpertBackend is a wrapper around torch module that allows it to run tasks asynchronously with Runtime
     By default, ExpertBackend handles three types of requests:
 
      - forward - receive inputs and compute outputs. Concurrent requests will be batched for better GPU utilization.
@@ -57,7 +57,7 @@ class ExpertBackend(nn.Module):
 
     def forward(self, *inputs: torch.Tensor) -> Tuple[torch.Tensor, ...]:
         """
-        Apply forward pass to an aggregated batch of requests. Used by TesseractRuntime, do not call this manually;
+        Apply forward pass to an aggregated batch of requests. Used by Runtime, do not call this manually;
         To submit a request for asynchronous processing, please use ``ExpertBackend.forward_pool.submit_task``.
 
         Subclassing:
@@ -78,7 +78,7 @@ class ExpertBackend(nn.Module):
 
     def backward(self, *inputs: torch.Tensor) -> Tuple[torch.Tensor, ...]:
         """
-        Apply backward pass to an aggregated batch of requests. Used by TesseractRuntime, do not call this manually
+        Apply backward pass to an aggregated batch of requests. Used by Runtime, do not call this manually
         To submit a request for asynchronous processing, please use ``ExpertBackend.backward_pool.submit_task``.
 
         Subclassing:
@@ -86,7 +86,7 @@ class ExpertBackend(nn.Module):
 
            It should return gradients w.r.t. inputs that follow ``nested_flatten(self.forward_schema)``;
 
-           TesseractRuntime doesn't guarantee that backward will be performed in the same order and for the same data
+           Runtime doesn't guarantee that backward will be performed in the same order and for the same data
            as forward, so we recommend stateless backward pass that re-runs expert forward pass inside backward.
 
            .. todo state, randomness, etc
@@ -127,6 +127,6 @@ class ExpertBackend(nn.Module):
                     keyword_names=tuple(self.kwargs_schema.keys()))
 
     def get_pools(self) -> Sequence[TaskPool]:
-        """ return all pools that should be processed by ``TesseractRuntime`` """
+        """ return all pools that should be processed by ``Runtime`` """
         return self.forward_pool, self.backward_pool
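
For reference, the forward/backward pools returned by `get_pools` above are fed via `submit_task`, mirroring the Runtime docstring example earlier in this diff. The sketch below combines that flow with ExpertBackend construction as in `tests/test_utils/run_server.py`; the expert module, shapes, and the `future.result()` call are illustrative assumptions.

```python
# Hedged sketch: ExpertBackend construction as in tests/test_utils/run_server.py,
# task submission as in the Runtime docstring; not verified against this revision.
import torch
import hivemind
from hivemind.runtime import Runtime

expert = torch.jit.script(torch.nn.Linear(1024, 1024))
backend = hivemind.ExpertBackend(
    name='expert.0', expert=expert, opt=torch.optim.Adam(expert.parameters()),
    args_schema=(hivemind.BatchTensorProto(1024),),
    outputs_schema=hivemind.BatchTensorProto(1024),
    max_batch_size=16384)

runtime = Runtime({'expert.0': backend})
runtime.start()        # or runtime.run() to block the current thread
runtime.ready.wait()   # wait until experts are loaded and task pools exist
future = backend.forward_pool.submit_task(torch.randn(4, 1024))
outputs = future.result()  # resolves once the runtime has processed the batch
```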
 

+ 4 - 4
tesseract/runtime/task_pool.py → hivemind/runtime/task_pool.py

@@ -20,7 +20,7 @@ Task = namedtuple("Task", ("future", "args"))
 
 
 class TaskPoolBase(mp.Process):
-    """ A pool that accepts tasks and forms batches for parallel processing, interacts with TesseractRuntime """
+    """ A pool that accepts tasks and forms batches for parallel processing, interacts with Runtime """
 
     def __init__(self, process_func: callable):
         super().__init__()
@@ -55,10 +55,10 @@ class TaskPoolBase(mp.Process):
 
 class TaskPool(TaskPoolBase):
     """
-    Request aggregator that accepts processing requests, groups them into batches, waits for TesseractRuntime
+    Request aggregator that accepts processing requests, groups them into batches, waits for Runtime
     to process these batches and dispatches results back to request sources. Operates as a background process.
 
-    :param process_func: function to be applied to every formed batch; called by TesseractRuntime
+    :param process_func: function to be applied to every formed batch; called by Runtime
         Note that process_func should accept only \*args Tensors and return a flat tuple of Tensors
     :param max_batch_size: process at most this many inputs in a batch (task contains have one or several inputs)
     :param min_batch_size: process at least this many inputs in a batch, otherwise wait for more
@@ -81,7 +81,7 @@ class TaskPool(TaskPoolBase):
         self.tasks = mp.Queue(maxsize=pool_size or 0)
         self.undispatched_task_timestamps = mp.SimpleQueue()
 
-        # interaction with TesseractRuntime
+        # interaction with Runtime
         self.batch_receiver, self.batch_sender = mp.Pipe(duplex=False)  # send/recv arrays that contain batch inputs
         self.batch_received = mp.Event()  # runtime can notify pool that it can send next batch
         self.outputs_receiver, self.outputs_sender = mp.Pipe(duplex=False)  # send/recv arrays that contain outputs

+ 12 - 12
tesseract/server/__init__.py → hivemind/server/__init__.py

@@ -7,18 +7,18 @@ from typing import Dict
 from .connection_handler import handle_connection
 from .dht_handler import DHTHandlerThread
 from ..dht import DHTNode
-from ..runtime import TesseractRuntime, ExpertBackend
+from ..runtime import Runtime, ExpertBackend
 
 
-class TesseractServer(threading.Thread):
+class Server(threading.Thread):
     """
-    TesseractServer allows you to host "experts" - pytorch sub-networks used by Decentralized Mixture of Experts.
-    After creation, a server should be started: see TesseractServer.run or TesseractServer.run_in_background.
+    Server allows you to host "experts" - pytorch sub-networks used by Decentralized Mixture of Experts.
+    After creation, a server should be started: see Server.run or Server.run_in_background.
 
     A working server does 3 things:
-     - processes incoming forward/backward requests via TesseractRuntime (created by the server)
+     - processes incoming forward/backward requests via Runtime (created by the server)
      - publishes updates to expert status every :update_period: seconds
-     - follows orders from TesseractController - if it exists
+     - follows orders from HivemindController - if it exists
 
     :type dht: DHTNode or None. Server with dht=None will NOT be visible from DHT,
      but it will still support accessing experts directly with RemoteExpert(uid=UID, host=IPADDR, port=PORT).
@@ -40,15 +40,15 @@ class TesseractServer(threading.Thread):
         self.dht, self.experts, self.update_period = dht, expert_backends, update_period
         self.addr, self.port = addr, port
         self.conn_handlers = self._create_connection_handlers(conn_handler_processes)
-        self.runtime = TesseractRuntime(self.experts, **kwargs)
+        self.runtime = Runtime(self.experts, **kwargs)
 
         if start:
             self.run_in_background(await_ready=True)
 
     def run(self):
         """
-        Starts TesseractServer in the current thread. Initializes dht if necessary, starts connection handlers,
-        runs TesseractRuntime (self.runtime) to process incoming requests.
+        Starts Server in the current thread. Initializes dht if necessary, starts connection handlers,
+        runs Runtime (self.runtime) to process incoming requests.
         """
         if self.dht:
             if not self.dht.is_alive():
@@ -71,12 +71,12 @@ class TesseractServer(threading.Thread):
 
     def run_in_background(self, await_ready=True, timeout=None):
         """
-        Starts TesseractServer in a background thread. if await_ready, this method will wait until background server
+        Starts Server in a background thread. if await_ready, this method will wait until background server
         is ready to process incoming requests or for :timeout: seconds max.
         """
         self.start()
         if await_ready and not self.ready.wait(timeout=timeout):
-            raise TimeoutError("TesseractServer didn't notify .ready in {timeout} seconds")
+            raise TimeoutError("Server didn't notify .ready in {timeout} seconds")
 
     @property
     def ready(self) -> mp.synchronize.Event:
@@ -104,7 +104,7 @@ class TesseractServer(threading.Thread):
 
     def shutdown(self):
         """
-        Gracefully terminate a tesseract server, process-safe.
+        Gracefully terminate a hivemind server, process-safe.
         Please note that terminating server otherwise (e.g. by killing processes) may result in zombie processes.
         If you did already cause a zombie outbreak, your only option is to kill them with -9 (SIGKILL).
         """

+ 2 - 2
tesseract/server/connection_handler.py → hivemind/server/connection_handler.py

@@ -1,8 +1,8 @@
 from socket import socket
 from typing import Tuple, Dict
 
-from tesseract.runtime.expert_backend import ExpertBackend
-from tesseract.utils import PytorchSerializer, Connection
+from hivemind.runtime.expert_backend import ExpertBackend
+from hivemind.utils import PytorchSerializer, Connection
 
 
 def handle_connection(connection_tuple: Tuple[socket, str], experts: Dict[str, ExpertBackend]):

+ 0 - 0
tesseract/server/dht_handler.py → hivemind/server/dht_handler.py


+ 0 - 0
tesseract/utils/__init__.py → hivemind/utils/__init__.py


+ 0 - 0
tesseract/utils/autograd.py → hivemind/utils/autograd.py


+ 0 - 0
tesseract/utils/connection.py → hivemind/utils/connection.py


+ 0 - 0
tesseract/utils/data.py → hivemind/utils/data.py


+ 0 - 0
tesseract/utils/nested.py → hivemind/utils/nested.py


+ 0 - 0
tesseract/utils/proto.py → hivemind/utils/proto.py


+ 0 - 0
tesseract/utils/serializer.py → hivemind/utils/serializer.py


+ 0 - 0
tesseract/utils/shared_future.py → hivemind/utils/shared_future.py


+ 1 - 1
tesseract/utils/threading.py → hivemind/utils/threading.py

@@ -3,7 +3,7 @@ from concurrent.futures import Future, ThreadPoolExecutor, as_completed, Timeout
 import time
 from typing import Optional, List
 
-GLOBAL_EXECUTOR = ThreadPoolExecutor(max_workers=os.environ.get("TESSERACT_THREADS", float('inf')))
+GLOBAL_EXECUTOR = ThreadPoolExecutor(max_workers=os.environ.get("HIVEMIND_THREADS", float('inf')))
 
 
 def run_in_background(func: callable, *args, **kwargs) -> Future:

+ 3 - 3
setup.py

@@ -10,18 +10,18 @@ with open('requirements.txt') as requirements_file:
     install_requires = [str(requirement) for requirement in parse_requirements(requirements_file)]
 
 # loading version from setup.py
-with codecs.open(os.path.join(here, 'tesseract/__init__.py'), encoding='utf-8') as init_file:
+with codecs.open(os.path.join(here, 'hivemind/__init__.py'), encoding='utf-8') as init_file:
     version_match = re.search(r"^__version__ = ['\"]([^'\"]*)['\"]", init_file.read(), re.M)
     version_string = version_match.group(1)
 
 setup(
-    name='tesseract',
+    name='hivemind',
     version=version_string,
     description='',
     long_description='',
     author='Learning@home authors',
     author_email='mryabinin@hse.ru',
-    packages=['tesseract'],
+    packages=['hivemind'],
     license='MIT',
     install_requires=install_requires,
     classifiers=[

+ 10 - 10
tests/benchmark_throughput.py

@@ -7,14 +7,14 @@ import time
 
 import torch
 from test_utils import layers, print_device_info
-from tesseract import find_open_port
+from hivemind import find_open_port
 
-import tesseract
+import hivemind
 
 
 def client_process(can_start, benchmarking_failed, port, num_experts, batch_size, hid_dim, num_batches, backprop=True):
     can_start.wait()
-    experts = [tesseract.RemoteExpert(f"expert{i}", port=port) for i in range(num_experts)]
+    experts = [hivemind.RemoteExpert(f"expert{i}", port=port) for i in range(num_experts)]
 
     try:
         dummy_batch = torch.randn(batch_size, hid_dim)
@@ -62,14 +62,14 @@ def benchmark_throughput(num_experts=16, num_handlers=None, num_clients=128, num
         experts = {}
         for i in range(num_experts):
             expert = torch.jit.script(layers.name_to_block[expert_cls](hid_dim))
-            experts[f'expert{i}'] = tesseract.ExpertBackend(name=f'expert{i}',
-                                                            expert=expert, opt=torch.optim.Adam(expert.parameters()),
-                                                            args_schema=(tesseract.BatchTensorProto(hid_dim),),
-                                                            outputs_schema=tesseract.BatchTensorProto(hid_dim),
-                                                            max_batch_size=max_batch_size,
-                                                            )
+            experts[f'expert{i}'] = hivemind.ExpertBackend(name=f'expert{i}',
+                                                           expert=expert, opt=torch.optim.Adam(expert.parameters()),
+                                                           args_schema=(hivemind.BatchTensorProto(hid_dim),),
+                                                           outputs_schema=hivemind.BatchTensorProto(hid_dim),
+                                                           max_batch_size=max_batch_size,
+                                                           )
         timestamps['created_experts'] = time.perf_counter()
-        server = tesseract.TesseractServer(None, experts, port=port, conn_handler_processes=num_handlers, device=device)
+        server = hivemind.Server(None, experts, port=port, conn_handler_processes=num_handlers, device=device)
         server.start()
         server.ready.wait()
         timestamps['server_ready'] = time.perf_counter()

+ 6 - 6
tests/test_moe.py

@@ -1,5 +1,5 @@
 import torch
-import tesseract
+import hivemind
 from test_utils.run_server import background_server
 
 
@@ -20,8 +20,8 @@ def test_remote_module_call():
 
     with background_server(num_experts=num_experts, device='cpu',
                            no_optimizer=True, no_dht=True) as (localhost, server_port, dht_port):
-        experts = [tesseract.RemoteExpert(uid=f'expert.{i}', port=server_port) for i in range(num_experts)]
-        moe_output, = tesseract.client.moe._RemoteMoECall.apply(
+        experts = [hivemind.RemoteExpert(uid=f'expert.{i}', port=server_port) for i in range(num_experts)]
+        moe_output, = hivemind.client.moe._RemoteMoECall.apply(
             logits, experts[:len(logits)], k_min, timeout_after_k_min, backward_k_min, timeout_total, backward_timeout,
             [(None,), {}], xx)
 
@@ -45,15 +45,15 @@ def test_remote_module_call():
 
 def test_compute_expert_scores():
     try:
-        dht = tesseract.DHTNode(port=tesseract.find_open_port(), start=True)
-        moe = tesseract.client.moe.RemoteMixtureOfExperts(
+        dht = hivemind.DHTNode(port=hivemind.find_open_port(), start=True)
+        moe = hivemind.client.moe.RemoteMixtureOfExperts(
             dht=dht, in_features=1024, grid_size=[40], k_best=4, k_min=1, timeout_after_k_min=1,
             uid_prefix='expert')
         gx, gy = torch.randn(4, 5, requires_grad=True), torch.torch.randn(4, 3, requires_grad=True)
         ii = [[4, 0, 2], [3, 1, 1, 1, 3], [0], [3, 2]]
         jj = [[2, 2, 1], [0, 1, 2, 0, 1], [0], [1, 2]]
         batch_experts = [
-            [tesseract.RemoteExpert(uid=f'expert.{ii[b][e]}.{jj[b][e]}') for e in range(len(ii[b]))]
+            [hivemind.RemoteExpert(uid=f'expert.{ii[b][e]}.{jj[b][e]}') for e in range(len(ii[b]))]
             for b in range(len(ii))
         ]  # note: these experts do not exists on server, we use them only to test moe compute_expert_scores
         logits = moe.compute_expert_scores([gx, gy], batch_experts)

+ 13 - 13
tests/test_utils/run_server.py

@@ -4,14 +4,14 @@ import multiprocessing as mp
 import argparse
 
 import torch
-import tesseract
+import hivemind
 from .layers import name_to_block
 
 
 def make_dummy_server(host='0.0.0.0', port=None, num_experts=1, expert_cls='ffn', hidden_dim=1024, num_handlers=None,
                       expert_prefix='expert', expert_offset=0, max_batch_size=16384, device=None, no_optimizer=False,
                       no_dht=False, initial_peers=(), dht_port=None, root_port=None, verbose=True, start=False,
-                      UID_DELIMETER=tesseract.DHTNode.UID_DELIMETER, **kwargs) -> tesseract.TesseractServer:
+                      UID_DELIMETER=hivemind.DHTNode.UID_DELIMETER, **kwargs) -> hivemind.Server:
     """ A context manager that creates server in a background thread, awaits .ready on entry and shutdowns on exit """
     if verbose and len(kwargs) != 0:
         print("Ignored kwargs:", kwargs)
@@ -24,8 +24,8 @@ def make_dummy_server(host='0.0.0.0', port=None, num_experts=1, expert_cls='ffn'
     if not no_dht:
         if not len(initial_peers):
             print("No initial peers provided. Starting additional dht as an initial peer.")
-            dht_root = tesseract.DHTNode(
-                *initial_peers, port=root_port or tesseract.find_open_port(), start=True)
+            dht_root = hivemind.DHTNode(
+                *initial_peers, port=root_port or hivemind.find_open_port(), start=True)
             print(f"Initializing DHT with port {dht_root.port}")
             initial_peers = (('localhost', dht_root.port), )
         else:
@@ -33,8 +33,8 @@ def make_dummy_server(host='0.0.0.0', port=None, num_experts=1, expert_cls='ffn'
             if root_port is not None:
                 print(f"Warning: root_port={root_port} will not be used since we already have peers.")
 
-        dht = tesseract.DHTNode(
-            *initial_peers, port=dht_port or tesseract.find_open_port(), start=True)
+        dht = hivemind.DHTNode(
+            *initial_peers, port=dht_port or hivemind.find_open_port(), start=True)
         if verbose:
             print(f"Running dht node on port {dht.port}")
 
@@ -44,14 +44,14 @@ def make_dummy_server(host='0.0.0.0', port=None, num_experts=1, expert_cls='ffn'
         expert = torch.jit.script(name_to_block[expert_cls](hidden_dim))
         opt = torch.optim.SGD(expert.parameters(), 0.0) if no_optimizer else torch.optim.Adam(expert.parameters())
         expert_uid = f'{expert_prefix}{UID_DELIMETER}{i + expert_offset}'
-        experts[expert_uid] = tesseract.ExpertBackend(name=expert_uid, expert=expert, opt=opt,
-                                                      args_schema=(tesseract.BatchTensorProto(hidden_dim),),
-                                                      outputs_schema=tesseract.BatchTensorProto(hidden_dim),
-                                                      max_batch_size=max_batch_size,
-                                                      )
+        experts[expert_uid] = hivemind.ExpertBackend(name=expert_uid, expert=expert, opt=opt,
+                                                     args_schema=(hivemind.BatchTensorProto(hidden_dim),),
+                                                     outputs_schema=hivemind.BatchTensorProto(hidden_dim),
+                                                     max_batch_size=max_batch_size,
+                                                     )
     # actually start server
-    server = tesseract.TesseractServer(
-        dht, experts, addr=host, port=port or tesseract.find_open_port(),
+    server = hivemind.Server(
+        dht, experts, addr=host, port=port or hivemind.find_open_port(),
         conn_handler_processes=num_handlers, device=device)
 
     if start: