Fix Windows env setup bugs and other typos. (#11)
This commit is contained in:
parent
98feb79057
commit
4da857d86e
2
setup.py
2
setup.py
@ -16,7 +16,7 @@ setup(
|
|||||||
name='tianshou',
|
name='tianshou',
|
||||||
version=version,
|
version=version,
|
||||||
description='A Library for Deep Reinforcement Learning',
|
description='A Library for Deep Reinforcement Learning',
|
||||||
long_description=open('README.md').read(),
|
long_description=open('README.md', encoding='utf8').read(),
|
||||||
long_description_content_type='text/markdown',
|
long_description_content_type='text/markdown',
|
||||||
url='https://github.com/thu-ml/tianshou',
|
url='https://github.com/thu-ml/tianshou',
|
||||||
author='TSAIL',
|
author='TSAIL',
|
||||||
|
@ -74,7 +74,7 @@ def test_a2c(args=get_args()):
|
|||||||
policy, train_envs, ReplayBuffer(args.buffer_size))
|
policy, train_envs, ReplayBuffer(args.buffer_size))
|
||||||
test_collector = Collector(policy, test_envs)
|
test_collector = Collector(policy, test_envs)
|
||||||
# log
|
# log
|
||||||
writer = SummaryWriter(args.logdir + '/' + 'ppo')
|
writer = SummaryWriter(args.logdir + '/' + 'a2c')
|
||||||
|
|
||||||
def stop_fn(x):
|
def stop_fn(x):
|
||||||
return x >= env.spec.reward_threshold
|
return x >= env.spec.reward_threshold
|
||||||
|
@ -73,7 +73,7 @@ def test_dqn(args=get_args()):
|
|||||||
# policy.set_eps(1)
|
# policy.set_eps(1)
|
||||||
train_collector.collect(n_step=args.batch_size)
|
train_collector.collect(n_step=args.batch_size)
|
||||||
# log
|
# log
|
||||||
writer = SummaryWriter(args.logdir + '/' + 'ppo')
|
writer = SummaryWriter(args.logdir + '/' + 'dqn')
|
||||||
|
|
||||||
def stop_fn(x):
|
def stop_fn(x):
|
||||||
return x >= env.spec.reward_threshold
|
return x >= env.spec.reward_threshold
|
||||||
|
@ -122,7 +122,7 @@ def test_pg(args=get_args()):
|
|||||||
policy, train_envs, ReplayBuffer(args.buffer_size))
|
policy, train_envs, ReplayBuffer(args.buffer_size))
|
||||||
test_collector = Collector(policy, test_envs)
|
test_collector = Collector(policy, test_envs)
|
||||||
# log
|
# log
|
||||||
writer = SummaryWriter(args.logdir + '/' + 'ppo')
|
writer = SummaryWriter(args.logdir + '/' + 'pg')
|
||||||
|
|
||||||
def stop_fn(x):
|
def stop_fn(x):
|
||||||
return x >= env.spec.reward_threshold
|
return x >= env.spec.reward_threshold
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
from tianshou import data, env, utils, policy, trainer, \
|
from tianshou import data, env, utils, policy, trainer, \
|
||||||
exploration
|
exploration
|
||||||
|
|
||||||
__version__ = '0.2.0post2'
|
__version__ = '0.2.0.post2'
|
||||||
__all__ = [
|
__all__ = [
|
||||||
'env',
|
'env',
|
||||||
'data',
|
'data',
|
||||||
|
Loading…
x
Reference in New Issue
Block a user