diff --git a/examples/rl_gsm8k/orchestrate_rl.py b/examples/rl_gsm8k/orchestrate_rl.py index 930ad786..49c8c3ad 100644 --- a/examples/rl_gsm8k/orchestrate_rl.py +++ b/examples/rl_gsm8k/orchestrate_rl.py @@ -19,6 +19,7 @@ from termcolor import colored from tqdm import tqdm +import wandb from tapeagents.agent import Agent from tapeagents.core import LLMCall, LLMOutputParsingFailureAction, StepMetadata, TrainingText from tapeagents.finetune.data import MASKED_TOKEN_ID