diff --git a/README.md b/README.md index 833a856..36a379b 100644 --- a/README.md +++ b/README.md @@ -234,7 +234,7 @@ result = ts.trainer.offpolicy_trainer( train_fn=lambda epoch, env_step: policy.set_eps(eps_train), test_fn=lambda epoch, env_step: policy.set_eps(eps_test), stop_fn=lambda mean_rewards: mean_rewards >= env.spec.reward_threshold, - writer=writer, task=task) + writer=writer) print(f'Finished training! Use {result["duration"]}') ```