Tianshou/tianshou/data/batch.py

import torch
import pprint
import numpy as np
from typing import Any, List, Union, Iterator, Optional


class Batch:
    """Tianshou provides :class:`~tianshou.data.Batch` as the internal data
    structure to pass any kind of data to other methods, for example, a
    collector gives a :class:`~tianshou.data.Batch` to policy for learning.
    Here is the usage:
    ::

        >>> import numpy as np
        >>> from tianshou.data import Batch
        >>> data = Batch(a=4, b=[5, 5], c='2312312')
        >>> data.b
        [5, 5]
        >>> data.b = np.array([3, 4, 5])
        >>> print(data)
        Batch(
            a: 4,
            b: array([3, 4, 5]),
            c: '2312312',
        )

    In short, you can define a :class:`Batch` with any key-value pair. The
    current implementation of Tianshou typically uses 7 reserved keys in
    :class:`~tianshou.data.Batch`:

    * ``obs`` the observation of step :math:`t` ;
    * ``act`` the action of step :math:`t` ;
    * ``rew`` the reward of step :math:`t` ;
    * ``done`` the done flag of step :math:`t` ;
    * ``obs_next`` the observation of step :math:`t+1` ;
    * ``info`` the info of step :math:`t` (in ``gym.Env``, the ``env.step()``\
        function returns 4 arguments, and the last one is ``info``);
    * ``policy`` the data computed by policy in step :math:`t`;

    A ``dict`` value (or a non-empty list/array of dicts, except under the
    ``info`` key) is stored flattened: each sub-key lives in ``__dict__``
    under ``'_<key>@<subkey>'`` and the sub-key names are recorded in
    ``_meta[<key>]``. Reading ``batch.<key>`` rebuilds a new
    :class:`Batch` from those flattened entries.

    :class:`~tianshou.data.Batch` has other methods, including
    :meth:`~tianshou.data.Batch.__getitem__`,
    :meth:`~tianshou.data.Batch.__len__`,
    :meth:`~tianshou.data.Batch.append`,
    and :meth:`~tianshou.data.Batch.split`:
    ::

        >>> data = Batch(obs=np.array([0, 11, 22]), rew=np.array([6, 6, 6]))
        >>> # here we test __getitem__
        >>> index = [2, 1]
        >>> data[index].obs
        array([22, 11])

        >>> # here we test __len__
        >>> len(data)
        3

        >>> data.append(data)  # similar to list.append
        >>> data.obs
        array([ 0, 11, 22,  0, 11, 22])

        >>> # split whole data into multiple small batch
        >>> for d in data.split(size=2, shuffle=False):
        ...     print(d.obs, d.rew)
        [ 0 11] [6 6]
        [22  0] [6 6]
        [11 22] [6 6]
    """

    def __init__(self, **kwargs) -> None:
        """Store every keyword argument as a field of the batch.

        Dict values, and non-empty lists/arrays whose first element is a
        dict (unless the key is ``'info'``), are flattened into
        ``'_<key>@<subkey>'`` entries; everything else is stored as is.
        """
        super().__init__()
        self._meta = {}
        for k, v in kwargs.items():
            # A 0-d ndarray has no len(); treat it as a plain value instead
            # of crashing in the "sequence of dicts" probe below.
            is_seq = isinstance(v, list) or (
                isinstance(v, np.ndarray) and v.ndim > 0)
            if is_seq and len(v) > 0 and isinstance(v[0], dict) \
                    and k != 'info':
                # The sub-keys of the first element define the layout.
                self._meta[k] = list(v[0].keys())
                for k_ in v[0].keys():
                    k__ = '_' + k + '@' + k_
                    self.__dict__[k__] = np.array([item[k_] for item in v])
            elif isinstance(v, dict):
                self._meta[k] = list(v.keys())
                for k_, v_ in v.items():
                    k__ = '_' + k + '@' + k_
                    self.__dict__[k__] = v_
            else:
                self.__dict__[k] = v

    def __getitem__(
        self, index: Union[str, slice, int, np.ndarray, List[int]]
    ) -> Union['Batch', Any]:
        """Return self[index].

        A string index is a field lookup (same as attribute access). Any
        other index is applied to every stored field that is not ``None``
        and the results are gathered in a new :class:`Batch`.
        """
        if isinstance(index, str):
            return self.__getattr__(index)
        b = Batch()
        for k, v in self.__dict__.items():
            if k != '_meta' and v is not None:
                b.__dict__[k] = v[index]
        # Copy the mapping so that appending to the result cannot register
        # new keys on this batch.
        b._meta = dict(self._meta)
        return b

    def __getattr__(self, key: str) -> Union['Batch', Any]:
        """Return self.key.

        Only called when normal attribute lookup fails. Keys recorded in
        ``_meta`` are rebuilt into a new :class:`Batch` from their
        flattened entries.

        :raises AttributeError: if ``key`` is neither a flattened key nor
            an entry of ``__dict__``.
        """
        # Read ``_meta`` straight from ``__dict__``: on an instance created
        # without ``__init__`` (copy / pickle use ``__new__``) looking it up
        # as an attribute would re-enter this method without end.
        meta = self.__dict__.get('_meta', {})
        if key not in meta:
            if key not in self.__dict__:
                raise AttributeError(key)
            return self.__dict__[key]
        d = {}
        for k_ in meta[key]:
            k__ = '_' + key + '@' + k_
            d[k_] = self.__dict__[k__]
        return Batch(**d)

    def __repr__(self) -> str:
        """Return repr(self): one ``key: value`` line per visible field,
        sorted by key. Fields whose value is ``None`` are omitted.
        """
        lines = []
        for k in sorted(list(self.__dict__) + list(self._meta)):
            if k.startswith('_'):
                # '_meta' and flattened '_key@subkey' entries are internal.
                continue
            if self.__dict__.get(k, None) is not None or k in self._meta:
                # Align continuation lines of a multi-line value with the
                # first character after "    key: ".
                rpl = '\n' + ' ' * (6 + len(k))
                obj = pprint.pformat(self.__getattr__(k)).replace('\n', rpl)
                lines.append(f'    {k}: {obj},\n')
        name = self.__class__.__name__
        if not lines:
            return name + '()'
        return name + '(\n' + ''.join(lines) + ')'

    def keys(self) -> List[str]:
        """Return the sorted list of field names: flattened keys plus every
        ``__dict__`` entry that does not start with an underscore.
        """
        return sorted(list(self._meta.keys()) +
                      [k for k in self.__dict__.keys() if k[0] != '_'])

    def values(self) -> List[Any]:
        """Return the field values, in the same order as :meth:`keys`."""
        return [self[k] for k in self.keys()]

    def get(self, k: str, d: Optional[Any] = None) -> Union['Batch', Any]:
        """Return self[k] if k in self else d. d defaults to None."""
        if k in self.__dict__ or k in self._meta:
            return self.__getattr__(k)
        return d

    def to_numpy(self) -> None:
        """Change all torch.Tensor to numpy.ndarray. This is an inplace
        operation. Nested :class:`Batch` values are converted recursively.
        """
        # Only existing keys are reassigned, so mutating while iterating
        # is safe (the dict never changes size).
        for k, v in self.__dict__.items():
            if isinstance(v, torch.Tensor):
                # detach() first: numpy() refuses tensors that require grad.
                self.__dict__[k] = v.detach().cpu().numpy()
            elif isinstance(v, Batch):
                v.to_numpy()

    def to_torch(self,
                 dtype: Optional[torch.dtype] = None,
                 device: Union[str, int, torch.device] = 'cpu'
                 ) -> None:
        """Change all numpy.ndarray to torch.Tensor. This is an inplace
        operation. Nested :class:`Batch` values are converted recursively
        with the same ``dtype`` and ``device``.

        :param dtype: if not ``None``, every converted tensor is cast to
            this type.
        :param device: the device the converted tensors are moved to.
        """
        for k, v in self.__dict__.items():
            if isinstance(v, np.ndarray):
                v = torch.from_numpy(v).to(device)
                if dtype is not None:
                    v = v.type(dtype)
                self.__dict__[k] = v
            elif isinstance(v, Batch):
                # Forward the options; otherwise nested data would silently
                # stay on CPU with its original dtype.
                v.to_torch(dtype, device)

    def append(self, batch: 'Batch') -> None:
        """Append a :class:`~tianshou.data.Batch` object to current batch.

        Fields missing (or ``None``) in the current batch are taken over
        from ``batch``; ndarray, tensor and list fields are concatenated.
        ``None`` fields of ``batch`` are ignored.

        :raises TypeError: if a field present on both sides has a type
            other than ndarray, tensor or list.
        """
        assert isinstance(batch, Batch), 'Only append Batch is allowed!'
        for k, v in batch.__dict__.items():
            if k == '_meta':
                self._meta.update(batch._meta)
                continue
            if v is None:
                continue
            # Look only at stored data: hasattr() would also report method
            # names such as 'keys' and make the __dict__ lookup fail.
            current = self.__dict__.get(k)
            if current is None:
                self.__dict__[k] = v
            elif isinstance(v, np.ndarray):
                self.__dict__[k] = np.concatenate([current, v])
            elif isinstance(v, torch.Tensor):
                self.__dict__[k] = torch.cat([current, v])
            elif isinstance(v, list):
                # Build a new list: ``current`` may be the very list object
                # of a previously appended batch and must not be mutated.
                self.__dict__[k] = current + v
            else:
                raise TypeError(
                    f'No support for append with type {type(v)} '
                    f'in class Batch.')

    def __len__(self) -> int:
        """Return len(self): the smallest length among the stored fields
        that are not ``None``, or 0 if there is no such field.
        """
        return min((len(v) for k, v in self.__dict__.items()
                    if k != '_meta' and v is not None), default=0)

    def split(self, size: Optional[int] = None,
              shuffle: bool = True) -> Iterator['Batch']:
        """Split whole data into multiple small batch.

        :param int size: if it is ``None``, it does not split the data batch;
            otherwise it will divide the data batch with the given size.
            Default to ``None``.
        :param bool shuffle: randomly shuffle the entire data batch if it is
            ``True``, otherwise remain in the same. Default to ``True``.

        An empty batch yields nothing.
        """
        length = len(self)
        if length == 0:
            return
        if size is None:
            size = length
        if shuffle:
            indices = np.random.permutation(length)
        else:
            indices = np.arange(length)
        for idx in np.arange(0, length, size):
            yield self[indices[idx:(idx + size)]]
add cache buf in collector 2020-03-14 21:48:31 +08:00			`import torch`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`import pprint`
maybe finished collector? 2020-03-13 17:49:22 +08:00			`import numpy as np`
add type annotation 2020-05-12 11:31:47 +08:00			`from typing import Any, List, Union, Iterator, Optional`
maybe finished collector? 2020-03-13 17:49:22 +08:00

Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`class Batch:`
add docs of collector and trainer (#20) 2020-04-05 18:34:45 +08:00			"""Tianshou provides :class:`~tianshou.data.Batch` as the internal data
add some docs 2020-04-03 21:28:12 +08:00			`structure to pass any kind of data to other methods, for example, a`
			collector gives a :class:`~tianshou.data.Batch` to policy for learning.
			`Here is the usage:`
			`::`

			`>>> import numpy as np`
			`>>> from tianshou.data import Batch`
			`>>> data = Batch(a=4, b=[5, 5], c='2312312')`
			`>>> data.b`
			`[5, 5]`
			`>>> data.b = np.array([3, 4, 5])`
seealso and change policy dir structure 2020-04-09 21:36:53 +08:00			`>>> print(data)`
			`Batch(`
			`a: 4,`
add type annotation 2020-05-12 11:31:47 +08:00			`b: array([3, 4, 5]),`
			`c: '2312312',`
seealso and change policy dir structure 2020-04-09 21:36:53 +08:00			`)`
add some docs 2020-04-03 21:28:12 +08:00
			In short, you can define a :class:`Batch` with any key-value pair. The
reserve 'policy' keyword in replay buffer 2020-04-29 17:48:48 +08:00			`current implementation of Tianshou typically use 7 reserved keys in`
add some docs 2020-04-03 21:28:12 +08:00			:class:`~tianshou.data.Batch`:

add docs of collector and trainer (#20) 2020-04-05 18:34:45 +08:00			* ``obs`` the observation of step :math:`t` ;
			* ``act`` the action of step :math:`t` ;
			* ``rew`` the reward of step :math:`t` ;
			* ``done`` the done flag of step :math:`t` ;
			* ``obs_next`` the observation of step :math:`t+1` ;
			* ``info`` the info of step :math:`t` (in ``gym.Env``, the ``env.step()``\
add some docs 2020-04-03 21:28:12 +08:00			function return 4 arguments, and the last one is ``info``);
reserve 'policy' keyword in replay buffer 2020-04-29 17:48:48 +08:00			* ``policy`` the data computed by policy in step :math:`t`;
add some docs 2020-04-03 21:28:12 +08:00
			:class:`~tianshou.data.Batch` has other methods, including
			:meth:`~tianshou.data.Batch.__getitem__`,
			:meth:`~tianshou.data.Batch.__len__`,
			:meth:`~tianshou.data.Batch.append`,
			and :meth:`~tianshou.data.Batch.split`:
			`::`

			`>>> data = Batch(obs=np.array([0, 11, 22]), rew=np.array([6, 6, 6]))`
			`>>> # here we test __getitem__`
			`>>> index = [2, 1]`
			`>>> data[index].obs`
			`array([22, 11])`

			`>>> # here we test __len__`
			`>>> len(data)`
			`3`

			`>>> data.append(data) # similar to list.append`
			`>>> data.obs`
			`array([0, 11, 22, 0, 11, 22])`

			`>>> # split whole data into multiple small batch`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`>>> for d in data.split(size=2, shuffle=False):`
add some docs 2020-04-03 21:28:12 +08:00			`... print(d.obs, d.rew)`
			`[ 0 11] [6 6]`
			`[22 0] [6 6]`
			`[11 22] [6 6]`
			`"""`
maybe finished collector? 2020-03-13 17:49:22 +08:00
add type annotation 2020-05-12 11:31:47 +08:00			`def __init__(self, **kwargs) -> None:`
env and data 2020-03-11 09:09:56 +08:00			`super().__init__()`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`self._meta = {}`
			`for k, v in kwargs.items():`
item3 of #51 2020-05-27 11:02:23 +08:00			`if isinstance(v, (list, np.ndarray)) \`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`and len(v) > 0 and isinstance(v[0], dict) and k != 'info':`
			`self._meta[k] = list(v[0].keys())`
			`for k_ in v[0].keys():`
			`k__ = '_' + k + '@' + k_`
			`self.__dict__[k__] = np.array([`
			`v[i][k_] for i in range(len(v))`
			`])`
item3 of #51 2020-05-27 11:02:23 +08:00			`elif isinstance(v, dict):`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`self._meta[k] = list(v.keys())`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`for k_, v_ in v.items():`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`k__ = '_' + k + '@' + k_`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`self.__dict__[k__] = v_`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`else:`
			`self.__dict__[k] = kwargs[k]`
half of collector 2020-03-12 22:20:33 +08:00
add type annotation 2020-05-12 11:31:47 +08:00			`def __getitem__(self, index: Union[str, slice]) -> Union['Batch', dict]:`
docs for env 2020-04-04 21:02:06 +08:00			`"""Return self[index]."""`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`if isinstance(index, str):`
			`return self.__getattr__(index)`
add cache buf in collector 2020-03-14 21:48:31 +08:00			`b = Batch()`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`for k, v in self.__dict__.items():`
			`if k != '_meta' and v is not None:`
			`b.__dict__.update(**{k: v[index]})`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`b._meta = self._meta`
add cache buf in collector 2020-03-14 21:48:31 +08:00			`return b`

add type annotation 2020-05-12 11:31:47 +08:00			`def __getattr__(self, key: str) -> Union['Batch', Any]:`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`"""Return self.key"""`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`if key not in self._meta.keys():`
support Batch of Batch and fix bugs (#38) 2020-04-29 12:14:53 +08:00			`if key not in self.__dict__:`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`raise AttributeError(key)`
			`return self.__dict__[key]`
			`d = {}`
			`for k_ in self._meta[key]:`
			`k__ = '_' + key + '@' + k_`
			`d[k_] = self.__dict__[k__]`
support Batch of Batch and fix bugs (#38) 2020-04-29 12:14:53 +08:00			`return Batch(**d)`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00
add type annotation 2020-05-12 11:31:47 +08:00			`def __repr__(self) -> str:`
fix rnn (#19), add __repr__, and fix #26 2020-04-09 19:53:45 +08:00			`"""Return str(self)."""`
			`s = self.__class__.__name__ + '(\n'`
			`flag = False`
support Batch of Batch and fix bugs (#38) 2020-04-29 12:14:53 +08:00			`for k in sorted(list(self.__dict__) + list(self._meta)):`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`if k[0] != '_' and (self.__dict__.get(k, None) is not None or`
support Batch of Batch and fix bugs (#38) 2020-04-29 12:14:53 +08:00			`k in self._meta):`
fix rnn (#19), add __repr__, and fix #26 2020-04-09 19:53:45 +08:00			`rpl = '\n' + ' ' * (6 + len(k))`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`obj = pprint.pformat(self.__getattr__(k)).replace('\n', rpl)`
fix rnn (#19), add __repr__, and fix #26 2020-04-09 19:53:45 +08:00			`s += f' {k}: {obj},\n'`
			`flag = True`
			`if flag:`
support Batch of Batch and fix bugs (#38) 2020-04-29 12:14:53 +08:00			`s += ')'`
fix rnn (#19), add __repr__, and fix #26 2020-04-09 19:53:45 +08:00			`else:`
support Batch of Batch and fix bugs (#38) 2020-04-29 12:14:53 +08:00			`s = self.__class__.__name__ + '()'`
fix rnn (#19), add __repr__, and fix #26 2020-04-09 19:53:45 +08:00			`return s`

add type annotation 2020-05-12 11:31:47 +08:00			`def keys(self) -> List[str]:`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`"""Return self.keys()."""`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`return sorted(list(self._meta.keys()) +`
			`[k for k in self.__dict__.keys() if k[0] != '_'])`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00
fix #56 2020-05-29 08:03:37 +08:00			`def values(self) -> List[Any]:`
			`"""Return self.values()."""`
			`return [self[k] for k in self.keys()]`

add type annotation 2020-05-12 11:31:47 +08:00			`def get(self, k: str, d: Optional[Any] = None) -> Union['Batch', Any]:`
add preprocess_fn (#42) 2020-05-05 13:39:51 +08:00			`"""Return self[k] if k in self else d. d defaults to None."""`
			`if k in self.__dict__ or k in self._meta:`
			`return self.__getattr__(k)`
			`return d`

Robust conversion from/to numpy/pytorch (#63) * Enable to convert Batch data back to torch. * Add torch converter to collector. * Fix * Move to_numpy/to_torch convert in dedicated utils.py. * Use to_numpy/to_torch to convert arrays. * fix lint * fix * Add unit test to check Batch from/to numpy. * Fix Batch over Batch. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 14:45:21 +02:00			`def to_numpy(self) -> None:`
reserve 'policy' keyword in replay buffer 2020-04-29 17:48:48 +08:00			`"""Change all torch.Tensor to numpy.ndarray. This is an inplace`
			`operation.`
			`"""`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`for k, v in self.__dict__.items():`
			`if isinstance(v, torch.Tensor):`
			`self.__dict__[k] = v.cpu().numpy()`
Robust conversion from/to numpy/pytorch (#63) * Enable to convert Batch data back to torch. * Add torch converter to collector. * Fix * Move to_numpy/to_torch convert in dedicated utils.py. * Use to_numpy/to_torch to convert arrays. * fix lint * fix * Add unit test to check Batch from/to numpy. * Fix Batch over Batch. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 14:45:21 +02:00			`elif isinstance(v, Batch):`
			`v.to_numpy()`

			`def to_torch(self,`
			`dtype: Optional[torch.dtype] = None,`
			`device: Union[str, int] = 'cpu'`
			`) -> None:`
			`"""Change all numpy.ndarray to torch.Tensor. This is an inplace`
			`operation.`
			`"""`
			`for k, v in self.__dict__.items():`
			`if isinstance(v, np.ndarray):`
			`v = torch.from_numpy(v).to(device)`
			`if dtype is not None:`
			`v = v.type(dtype)`
			`self.__dict__[k] = v`
			`elif isinstance(v, Batch):`
			`v.to_torch()`
reserve 'policy' keyword in replay buffer 2020-04-29 17:48:48 +08:00
add type annotation 2020-05-12 11:31:47 +08:00			`def append(self, batch: 'Batch') -> None:`
add docs of collector and trainer (#20) 2020-04-05 18:34:45 +08:00			"""Append a :class:`~tianshou.data.Batch` object to current batch."""
maybe finished collector? 2020-03-13 17:49:22 +08:00			`assert isinstance(batch, Batch), 'Only append Batch is allowed!'`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`for k, v in batch.__dict__.items():`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`if k == '_meta':`
support Batch of Batch and fix bugs (#38) 2020-04-29 12:14:53 +08:00			`self._meta.update(batch._meta)`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`continue`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`if v is None:`
maybe finished collector? 2020-03-13 17:49:22 +08:00			`continue`
			`if not hasattr(self, k) or self.__dict__[k] is None:`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`self.__dict__[k] = v`
			`elif isinstance(v, np.ndarray):`
			`self.__dict__[k] = np.concatenate([self.__dict__[k], v])`
			`elif isinstance(v, torch.Tensor):`
			`self.__dict__[k] = torch.cat([self.__dict__[k], v])`
			`elif isinstance(v, list):`
			`self.__dict__[k] += v`
maybe finished collector? 2020-03-13 17:49:22 +08:00			`else:`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`s = f'No support for append with type \`
			`{type(v)} in class Batch.'`
add rllib result and fix pep8 2020-03-28 09:43:35 +08:00			`raise TypeError(s)`
finish pg 2020-03-17 11:37:31 +08:00
add type annotation 2020-05-12 11:31:47 +08:00			`def __len__(self) -> int:`
docs for env 2020-04-04 21:02:06 +08:00			`"""Return len(self)."""`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`return min([len(v) for k, v in self.__dict__.items()`
			`if k != '_meta' and v is not None])`
add some docs 2020-04-03 21:28:12 +08:00
add type annotation 2020-05-12 11:31:47 +08:00			`def split(self, size: Optional[int] = None,`
fix optional type syntax 2020-05-16 20:08:32 +08:00			`shuffle: bool = True) -> Iterator['Batch']:`
add docs of collector and trainer (#20) 2020-04-05 18:34:45 +08:00			`"""Split whole data into multiple small batch.`
add some docs 2020-04-03 21:28:12 +08:00
add policy docs (#21) 2020-04-06 19:36:59 +08:00			:param int size: if it is ``None``, it does not split the data batch;
add some docs 2020-04-03 21:28:12 +08:00			`otherwise it will divide the data batch with the given size.`
add policy docs (#21) 2020-04-06 19:36:59 +08:00			Default to ``None``.
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`:param bool shuffle: randomly shuffle the entire data batch if it is`
add policy docs (#21) 2020-04-06 19:36:59 +08:00			``True``, otherwise remain in the same. Default to ``True``.
add some docs 2020-04-03 21:28:12 +08:00			`"""`
			`length = len(self)`
finish pg 2020-03-17 11:37:31 +08:00			`if size is None:`
			`size = length`
Multimodal obs (#38, #27, #25) 2020-04-28 20:56:02 +08:00			`if shuffle:`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`indices = np.random.permutation(length)`
ppo and early stop 2020-03-20 19:52:29 +08:00			`else:`
Minor refactor for Batch class. (#61) * Minor refactor for Batch class. * Fix. * Add back key sorting. Co-authored-by: Alexis Duburcq <alexis.duburcq@wandercraft.eu> 2020-05-29 11:56:46 +02:00			`indices = np.arange(length)`
			`for idx in np.arange(0, length, size):`
			`yield self[indices[idx:(idx + size)]]`