test_custom_expert.py

import os
from typing import Optional

import pytest
import torch

from hivemind import RemoteExpert, background_server
@pytest.mark.forked
def test_custom_expert(port: Optional[int] = None, hid_dim=16):
    # Spawn a local server hosting two instances of the custom 'perceptron'
    # expert class defined in custom_networks.py, without a DHT.
    with background_server(
            expert_cls='perceptron', num_experts=2, device='cpu',
            hidden_dim=hid_dim, num_handlers=2, no_dht=True,
            custom_module_path=os.path.join(os.path.dirname(__file__), 'custom_networks.py')) as (server_endpoint, _):
        expert0 = RemoteExpert('expert.0', server_endpoint)
        expert1 = RemoteExpert('expert.1', server_endpoint)

        for batch_size in (1, 4):
            batch = torch.randn(batch_size, hid_dim)

            output0 = expert0(batch)
            output1 = expert1(batch)

            # Check that gradients propagate back through the remote experts.
            loss = output0.sum()
            loss.backward()
            loss = output1.sum()
            loss.backward()
@pytest.mark.forked
def test_multihead_expert(port: Optional[int] = None, hid_dim=16):
    # Same setup, but the 'multihead' expert class takes three input tensors
    # of different widths.
    with background_server(
            expert_cls='multihead', num_experts=2, device='cpu',
            hidden_dim=hid_dim, num_handlers=2, no_dht=True,
            custom_module_path=os.path.join(os.path.dirname(__file__), 'custom_networks.py')) as (server_endpoint, _):
        expert0 = RemoteExpert('expert.0', server_endpoint)
        expert1 = RemoteExpert('expert.1', server_endpoint)

        for batch_size in (1, 4):
            batch = (torch.randn(batch_size, hid_dim),
                     torch.randn(batch_size, 2 * hid_dim),
                     torch.randn(batch_size, 3 * hid_dim))

            output0 = expert0(*batch)
            output1 = expert1(*batch)

            # Check that gradients propagate back through the remote experts.
            loss = output0.sum()
            loss.backward()
            loss = output1.sum()
            loss.backward()
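
Both tests depend on a sibling custom_networks.py that defines and registers the 'perceptron' and 'multihead' expert classes. A minimal sketch of that module follows, assuming hivemind's register_expert_class(name, sample_input) decorator; the import path, class names, and layer sizes below are assumptions for illustration and may differ from the actual module or hivemind version.

custom_networks.py (sketch)

import torch
import torch.nn as nn
import torch.nn.functional as F

# Assumed import path; it varies between hivemind versions.
from hivemind.moe.server.layers.custom_experts import register_expert_class

# sample_input tells the server what input shapes the expert expects,
# given (batch_size, hidden_dim).
sample_input = lambda batch_size, hid_dim: torch.empty((batch_size, hid_dim))


@register_expert_class('perceptron', sample_input)
class MultilayerPerceptron(nn.Module):
    def __init__(self, hid_dim):
        super().__init__()
        self.layer1 = nn.Linear(hid_dim, 4 * hid_dim)
        self.layer2 = nn.Linear(4 * hid_dim, hid_dim)

    def forward(self, x):
        return self.layer2(F.relu(self.layer1(x)))


# Three inputs of widths hid_dim, 2 * hid_dim, 3 * hid_dim,
# matching the batch tuple built in test_multihead_expert.
multihead_sample_input = lambda batch_size, hid_dim: (
    torch.empty((batch_size, hid_dim)),
    torch.empty((batch_size, 2 * hid_dim)),
    torch.empty((batch_size, 3 * hid_dim)),
)


@register_expert_class('multihead', multihead_sample_input)
class MultiheadNetwork(nn.Module):
    def __init__(self, hid_dim):
        super().__init__()
        self.head1 = nn.Linear(hid_dim, hid_dim)
        self.head2 = nn.Linear(2 * hid_dim, hid_dim)
        self.head3 = nn.Linear(3 * hid_dim, hid_dim)

    def forward(self, x1, x2, x3):
        # Project each input to hid_dim and sum, so the output is a
        # single (batch_size, hid_dim) tensor.
        return self.head1(x1) + self.head2(x2) + self.head3(x3)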