Преглед на файлове

Try removing OffloadOptimizer

Aleksandr Borzunov преди 3 години
родител
ревизия
e97e7b8811
променени са 2 файла, в които са добавени 3 реда и са изтрити 5 реда
  1. 2 2
      arguments.py
  2. 1 3
      task.py

+ 2 - 2
arguments.py

@@ -9,8 +9,8 @@ from transformers import TrainingArguments
 class HFTrainerArguments(TrainingArguments):
     """Arguments for huggingface/transformers.Trainer"""
     dataloader_num_workers: int = 1
-    per_device_train_batch_size: int = 3
-    per_device_eval_batch_size: int = 3
+    per_device_train_batch_size: int = 2
+    per_device_eval_batch_size: int = 2
     gradient_accumulation_steps: int = 1
     text_seq_length: int = 256
 

+ 1 - 3
task.py

@@ -17,7 +17,6 @@ from arguments import HFTrainerArguments, BasePeerArguments, CollaborativeArgume
 from data import make_dataset
 from huggingface_auth import authorize_with_huggingface
 from lib.training.clipped_lamb import LambWithGradientClipping
-from lib.training.offload import OffloadOptimizer
 
 
 logger = hivemind.get_logger(__name__)
@@ -142,9 +141,8 @@ class TrainingTask:
             },
         ]
 
-        opt = OffloadOptimizer(
+        opt = LambWithGradientClipping(
             optimizer_grouped_parameters,
-            optim_cls=LambWithGradientClipping,
             lr=training_args.learning_rate,
             betas=(training_args.adam_beta1, training_args.adam_beta2),
             eps=training_args.adam_epsilon,