Fixup no_trainer save logic (#16968)

* Fixup all examples
This commit is contained in:
Zachary Mueller
2022-04-27 14:46:49 -04:00
committed by GitHub
parent c79bbc3ba5
commit 60e1d883f1
12 changed files with 200 additions and 132 deletions

View File

@@ -563,11 +563,13 @@ def main():
logger.info(f" Gradient Accumulation steps = {args.gradient_accumulation_steps}")
logger.info(f" Total optimization steps = {args.max_train_steps}")
completed_steps = 0
starting_epoch = 0
# Only show the progress bar once on each machine.
progress_bar = tqdm(range(args.max_train_steps), disable=not accelerator.is_local_main_process)
completed_steps = 0
for epoch in range(args.num_train_epochs):
starting_epoch = 0
for epoch in range(starting_epoch, args.num_train_epochs):
model.train()
for step, batch in enumerate(train_dataloader):
# compute num of losses