|
@@ -79,11 +79,8 @@ def get_optimizer_and_scheduler(training_args, model):
|
|
|
|
|
|
opt = Adafactor(
|
|
|
optimizer_grouped_parameters,
|
|
|
- lr=training_args.learning_rate,
|
|
|
eps=training_args.adam_epsilon,
|
|
|
weight_decay=training_args.weight_decay,
|
|
|
- relative_step=False,
|
|
|
-
|
|
|
)
|
|
|
|
|
|
scheduler = get_linear_schedule_with_warmup(
|