From 695f0061c8c9e1c9f710a8c05cbc7fdd91c375a1 Mon Sep 17 00:00:00 2001 From: rizar Date: Tue, 7 Jan 2025 21:06:05 +0000 Subject: [PATCH] fixed the skipped last step --- examples/rl_gsm8k/orchestrate_rl.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/rl_gsm8k/orchestrate_rl.py b/examples/rl_gsm8k/orchestrate_rl.py index fbaca406..fb520558 100644 --- a/examples/rl_gsm8k/orchestrate_rl.py +++ b/examples/rl_gsm8k/orchestrate_rl.py @@ -475,7 +475,7 @@ def main(cfg: DictConfig): finetune_cfg = cfg.copy() checkpoint_steps = finetune_cfg.finetune.save_checkpoint_steps - interrupt_train_steps = int((state["iteration"] + 1) * checkpoint_steps - 1) + interrupt_train_steps = int((state["iteration"] + 1) * checkpoint_steps) finetune_cfg.finetune.interrupt_train_steps = interrupt_train_steps finetune_cfg.output_dir = str(finetune_path)