fix readme (#273)
This commit is contained in:
parent
c6f2648e87
commit
866e35d550
@ -234,7 +234,7 @@ result = ts.trainer.offpolicy_trainer(
|
||||
train_fn=lambda epoch, env_step: policy.set_eps(eps_train),
|
||||
test_fn=lambda epoch, env_step: policy.set_eps(eps_test),
|
||||
stop_fn=lambda mean_rewards: mean_rewards >= env.spec.reward_threshold,
|
||||
writer=writer, task=task)
|
||||
writer=writer)
|
||||
print(f'Finished training! Use {result["duration"]}')
|
||||
```
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user