Explorar o código

hidden_act_gated = True

Max Ryabinin hai 3 anos
pai
achega
04173527c3
Modificouse 1 ficheiro con 1 adición e 1 borrado
  1. 1 1
      hivemind/moe/server/layers/albert.py

+ 1 - 1
hivemind/moe/server/layers/albert.py

@@ -46,7 +46,7 @@ _TOKENIZER_FOR_DOC = "AlbertTokenizer"
 
 class LeanAlbertConfig(AlbertConfig):
     rotary_embedding_base: int = 10_000
-    hidden_act_gated: bool = False
+    hidden_act_gated: bool = True
 
     def __hash__(self):
         return hash("\t".join(f"{k}={v}" for k, v in self.__dict__.items() if not k.startswith("_")))