Tianshou/test/base/env.py

43 lines
1.4 KiB
Python
Raw Normal View History

2020-03-21 10:58:01 +08:00
import gym
import time
class MyTestEnv(gym.Env):
    """Small deterministic chain environment used by the test-suite.

    The state is a single integer ``index``. Action ``0`` decrements it
    (clamped at 0) and action ``1`` increments it. The episode finishes
    once ``index`` equals ``size``; the increment that reaches ``size``
    yields reward 1, every other transition yields reward 0.

    Args:
        size: value of ``index`` at which the episode is finished.
        sleep: seconds to sleep inside every ``step`` call; values
            ``<= 0`` disable sleeping.
        dict_state: when true, observations are ``{'index': index}``
            dicts instead of the bare ``index`` value.
    """

    def __init__(self, size, sleep=0, dict_state=False):
        self.size = size
        self.sleep = sleep
        self.dict_state = dict_state
        self.reset()

    def _get_state(self):
        """Return the current observation in the configured format."""
        if self.dict_state:
            return {'index': self.index}
        return self.index

    def reset(self, state=0):
        """Clear the done flag, set ``index`` to ``state`` and return the
        resulting observation."""
        self.done = False
        self.index = state
        return self._get_state()

    def step(self, action):
        """Apply ``action`` and return ``(obs, reward, done, info)``.

        Args:
            action: ``0`` to move down (not below 0), ``1`` to move up.

        Raises:
            ValueError: if called after the episode has finished, or if
                ``action`` is neither 0 nor 1 while the episode is still
                running.
        """
        if self.done:
            raise ValueError('step after done !!!')
        if self.sleep > 0:
            time.sleep(self.sleep)
        # Already sitting on the terminal index (e.g. after
        # ``reset(state=size)``): finish immediately, whatever the action.
        if self.index == self.size:
            self.done = True
            return self._get_state(), 0, True, {}
        if action == 0:
            self.index = max(self.index - 1, 0)
            # The info dict is only populated in dict-state mode on this
            # branch; kept exactly as before because callers may rely on it.
            info = {'key': 1, 'env': self} if self.dict_state else {}
            return self._get_state(), 0, False, info
        if action == 1:
            self.index += 1
            self.done = self.index == self.size
            return self._get_state(), int(self.done), self.done, \
                {'key': 1, 'env': self}
        # Previously an unknown action fell through and returned None, which
        # only surfaced later as an unpacking error in the caller.
        raise ValueError('unsupported action: {!r}'.format(action))