Trinkle23897 39de63592f finish pg
2020-03-17 11:37:31 +08:00

25 lines
510 B
Python

from abc import ABC, abstractmethod
class BasePolicy(ABC):
    """Abstract base class that every policy derives from.

    Concrete subclasses must implement ``__call__`` and ``learn``; the
    class cannot be instantiated until both are overridden.
    ``process_fn`` and ``sync_weight`` are optional hooks whose default
    implementations do nothing.

    Attributes:
        model: Set to ``None`` by ``__init__``; presumably subclasses
            assign their underlying model here (not shown in this file).
    """

    def __init__(self):
        super().__init__()
        self.model = None

    def process_fn(self, batch, buffer, indice):
        """Hook for processing a batch; the default returns it unchanged.

        Args:
            batch: The data batch to process.
            buffer: Unused by the default implementation.
            indice: Unused by the default implementation.

        Returns:
            The very same ``batch`` object that was passed in.
        """
        return batch

    @abstractmethod
    def __call__(self, batch, state=None):
        """Run the policy on ``batch``; must be overridden.

        Args:
            batch: Input data for the policy.
            state: Optional state; defaults to ``None``.

        Returns:
            Per the original author's note, implementations are expected
            to return something of the form
            ``Batch(logits=..., act=np.array(), state=None, ...)``.
            This base implementation returns ``None``.
        """
        # return Batch(logits=..., act=np.array(), state=None, ...)
        pass

    @abstractmethod
    def learn(self, batch, batch_size=None):
        """Update the policy from ``batch``; must be overridden.

        Args:
            batch: Data to learn from.
            batch_size: Optional batch size; defaults to ``None``.
        """
        pass

    def sync_weight(self):
        """Optional hook; the default implementation is a no-op."""
        pass