瀏覽代碼

PR attribution

foksly 3 年之前
父節點
當前提交
4aa38e7191
共有 1 個文件被更改,包括 1 次插入和 1 次刪除
  1. 1 1
      benchmarks/benchmark_optimizer.py

+ 1 - 1
benchmarks/benchmark_optimizer.py

@@ -29,7 +29,7 @@ class TrainingArguments:
     reuse_grad_buffers: bool = True
     delay_grad_averaging: bool = True
     delay_optimizer_step: bool = True
-    average_state_every: int = 3
+    average_state_every: int = 1
     use_amp: bool = False
 
     lr_base: float = 0.1