fix exception in tutorials/dqn.rst (#327)
This commit is contained in:
parent
7db21f3df6
commit
8963a14327
@ -280,7 +280,7 @@ If you find Tianshou useful, please cite it in your publications.
|
|||||||
|
|
||||||
```latex
|
```latex
|
||||||
@misc{tianshou,
|
@misc{tianshou,
|
||||||
author = {Jiayi Weng, Minghao Zhang, Alexis Duburcq, Kaichao You, Dong Yan, Hang Su, Jun Zhu},
|
author = {Jiayi Weng, Huayu Chen, Alexis Duburcq, Kaichao You, Minghao Zhang, Dong Yan, Hang Su, Jun Zhu},
|
||||||
title = {Tianshou},
|
title = {Tianshou},
|
||||||
year = {2020},
|
year = {2020},
|
||||||
publisher = {GitHub},
|
publisher = {GitHub},
|
||||||
|
@ -129,8 +129,7 @@ Tianshou provides :func:`~tianshou.trainer.onpolicy_trainer`, :func:`~tianshou.t
|
|||||||
update_per_step=0.1, episode_per_test=100, batch_size=64,
|
update_per_step=0.1, episode_per_test=100, batch_size=64,
|
||||||
train_fn=lambda epoch, env_step: policy.set_eps(0.1),
|
train_fn=lambda epoch, env_step: policy.set_eps(0.1),
|
||||||
test_fn=lambda epoch, env_step: policy.set_eps(0.05),
|
test_fn=lambda epoch, env_step: policy.set_eps(0.05),
|
||||||
stop_fn=lambda mean_rewards: mean_rewards >= env.spec.reward_threshold,
|
stop_fn=lambda mean_rewards: mean_rewards >= env.spec.reward_threshold)
|
||||||
logger=None)
|
|
||||||
print(f'Finished training! Use {result["duration"]}')
|
print(f'Finished training! Use {result["duration"]}')
|
||||||
|
|
||||||
The meaning of each parameter is as follows (full description can be found at :func:`~tianshou.trainer.offpolicy_trainer`):
|
The meaning of each parameter is as follows (full description can be found at :func:`~tianshou.trainer.offpolicy_trainer`):
|
||||||
|
Loading…
x
Reference in New Issue
Block a user