Explorar o código

Add standard experts

Max Ryabinin hai 2 anos
pai
achega
0fc36c8eed
Modificouse 1 ficheiro con 0 adicións e 1 borrado
  1. 0 1
      hivemind/moe/server/layers/albert.py

+ 0 - 1
hivemind/moe/server/layers/albert.py

@@ -571,7 +571,6 @@ class HeadExpert(nn.Module):
 class StandardHeadExpert(HeadExpert):
     def __init__(self, hid_dim):
         super().__init__(hid_dim)
-        self.config.num_hidden_layers = 1
 
 
 body_sample_input = lambda batch_size, hid_dim: (torch.empty((batch_size, SEQUENCE_LENGTH, hid_dim)),)