correct resume training steps number in progress bar (#25691)

feat: correct the progress bar update when resuming training from a step checkpoint
This commit is contained in:
Phuc Van Phan 2023-08-24 01:09:14 +07:00 committed by GitHub
parent 6add3b313d
commit 656e17f6f7
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -598,8 +598,8 @@ def main():
# need to multiply `gradient_accumulation_steps` to reflect real steps
resume_step = int(training_difference.replace("step_", "")) * args.gradient_accumulation_steps
starting_epoch = resume_step // len(train_dataloader)
-resume_step -= starting_epoch * len(train_dataloader)
completed_steps = resume_step // args.gradient_accumulation_steps
+resume_step -= starting_epoch * len(train_dataloader)
# update the progress_bar if load from checkpoint
progress_bar.update(completed_steps)