swap order of optimizer.step() and scheduler.step()

This commit is contained in:
Andreas Daiminger
2019-08-28 19:18:27 +02:00
parent 0ecfd17f49
commit 1d15a7f278

View File

@@ -157,8 +157,8 @@ def train(args, train_dataset, model, tokenizer):
 tr_loss += loss.item()
 if (step + 1) % args.gradient_accumulation_steps == 0:
-    scheduler.step() # Update learning rate schedule
     optimizer.step()
+    scheduler.step() # Update learning rate schedule
     model.zero_grad()
     global_step += 1