20 lines
440 B
Python
20 lines
440 B
Python
from __future__ import absolute_import
|
|
from __future__ import division
|
|
|
|
import tensorflow as tf
|
|
|
|
|
|
class PolicyBase(object):
    """Base class for policies.

    Only defines the interface: an `act` method (with exploration) and a
    `reset` hook. `act` is not implemented here and must be overridden.
    """

    def act(self, observation, my_feed_dict):
        """Select an action for the given observation.

        :param observation: the observation to act on.
        :param my_feed_dict: additional feed values supplied by the caller
            (presumably a TensorFlow feed dict -- TODO confirm with callers).
        :raises NotImplementedError: always, in this base class.
        """
        raise NotImplementedError()

    def reset(self):
        """Reset the exploration state; a no-op in this base class.

        Meant for temporally correlated random-process exploration, as in
        DDPG.

        :return: None
        """
        pass
|