.. |
layers
|
62652e1717
Add Switch Transformers-like RemoteMixtureOfExperts (#228)
|
%!s(int64=4) %!d(string=hai) anos |
__init__.py
|
62652e1717
Add Switch Transformers-like RemoteMixtureOfExperts (#228)
|
%!s(int64=4) %!d(string=hai) anos |
checkpoints.py
|
3024d381c5
Support learning rate schedulers in ExpertBackend (#196)
|
%!s(int64=4) %!d(string=hai) anos |
connection_handler.py
|
916c3db52d
Move compression-related code to hivemind.utils.compression (#213)
|
%!s(int64=4) %!d(string=hai) anos |
dht_handler.py
|
f132294edb
Extract expert-specific methods from DHT (#192)
|
%!s(int64=4) %!d(string=hai) anos |
expert_backend.py
|
ca5c7610ae
Add tool for custom user experts (#189)
|
%!s(int64=4) %!d(string=hai) anos |
expert_uid.py
|
3024d381c5
Support learning rate schedulers in ExpertBackend (#196)
|
%!s(int64=4) %!d(string=hai) anos |
runtime.py
|
6128cbbd51
Add gradient clipping support to ExpertBackend (#214)
|
%!s(int64=4) %!d(string=hai) anos |
task_pool.py
|
6f8f192150
Improve Runtime exception handling (#207)
|
%!s(int64=4) %!d(string=hai) anos |