瀏覽代碼

hidden_act_gated = True

Max Ryabinin 3 年之前
父節點
當前提交
04173527c3
共有 1 個文件被更改,包括 1 次插入和 1 次删除
  1. 1 1
      hivemind/moe/server/layers/albert.py

+ 1 - 1
hivemind/moe/server/layers/albert.py

@@ -46,7 +46,7 @@ _TOKENIZER_FOR_DOC = "AlbertTokenizer"
 
 class LeanAlbertConfig(AlbertConfig):
     rotary_embedding_base: int = 10_000
-    hidden_act_gated: bool = False
+    hidden_act_gated: bool = True
 
     def __hash__(self):
         return hash("\t".join(f"{k}={v}" for k, v in self.__dict__.items() if not k.startswith("_")))