Docstring: minor changes to let ruff pass

2023-12-04 13:52:10 +01:00 · 2023-12-04 13:52:10 +01:00 · 2e39a252e3
commit 2e39a252e3
parent 28fda00b27
13 changed files with 56 additions and 36 deletions
--- a/docs/autogen_rst.py
+++ b/docs/autogen_rst.py
@ -39,6 +39,7 @@ def write_to_file(content: str, path: str):
 def make_rst(src_root, rst_root, clean=False, overwrite=False, package_prefix=""):
    """Creates/updates documentation in form of rst files for modules and packages.
    Does not delete any existing rst files. Thus, rst files for packages or modules that have been removed or renamed
    should be deleted by hand.
@ -116,6 +117,6 @@ if __name__ == "__main__":
    docs_root = Path(__file__).parent
    make_rst(
        docs_root / ".." / "tianshou",
-        docs_root / "api",
+        docs_root / "03_api",
        clean=True,
    )
--- a/tianshou/data/buffer/base.py
+++ b/tianshou/data/buffer/base.py
@ -18,7 +18,7 @@ class ReplayBuffer:
    stores all the data in a batch with circular-queue style.
    For the example usage of ReplayBuffer, please check out Section Buffer in
-    :doc:`/tutorials/01_concepts`.
+    :doc:`/01_tutorials/01_concepts`.
    :param size: the maximum size of replay buffer.
    :param stack_num: the frame-stack sampling argument, should be greater than or
--- a/tianshou/highlevel/env.py
+++ b/tianshou/highlevel/env.py
@ -81,8 +81,7 @@ class Environments(ToStringMixin, ABC):
        num_training_envs: int,
        num_test_envs: int,
    ) -> "Environments":
-        """Creates a suitable subtype instance from a factory function that creates a single instance and
+        """Creates a suitable subtype instance from a factory function that creates a single instance and the type of environment (continuous/discrete).
        the type of environment (continuous/discrete).
        :param factory_fn: the factory for a single environment instance
        :param env_type: the type of environments created by `factory_fn`
@ -115,8 +114,7 @@ class Environments(ToStringMixin, ABC):
        }
    def set_persistence(self, *p: Persistence) -> None:
-        """Associates the given persistence handlers which may persist and restore
+        """Associates the given persistence handlers which may persist and restore environment-specific information.
        environment-specific information.
        :param p: persistence handlers
        """
--- a/tianshou/highlevel/experiment.py
+++ b/tianshou/highlevel/experiment.py
@ -188,7 +188,9 @@ class Experiment(ToStringMixin):
        experiment_name: str | None = None,
        logger_run_id: str | None = None,
    ) -> ExperimentResult:
-        """:param experiment_name: the experiment name, which corresponds to the directory (within the logging
+        """Run the experiment and return the results.
        :param experiment_name: the experiment name, which corresponds to the directory (within the logging
            directory) where all results associated with the experiment will be saved.
            The name may contain path separators (i.e. `os.path.sep`, as used by `os.path.join`), in which case
            a nested directory structure will be created.
@ -327,6 +329,7 @@ class ExperimentBuilder:
    def with_logger_factory(self, logger_factory: LoggerFactory) -> Self:
        """Allows to customize the logger factory to use.
        If this method is not called, the default logger factory :class:`LoggerFactoryDefault` will be used.
        :param logger_factory: the factory to use
@ -346,6 +349,7 @@ class ExperimentBuilder:
    def with_optim_factory(self, optim_factory: OptimizerFactory) -> Self:
        """Allows to customize the gradient-based optimizer to use.
        By default, :class:`OptimizerFactoryAdam` will be used with default parameters.
        :param optim_factory: the optimizer factory
@ -390,6 +394,7 @@ class ExperimentBuilder:
    def with_trainer_stop_callback(self, callback: TrainerStopCallback) -> Self:
        """Allows to define a callback that decides whether training shall stop early.
        The callback receives the undiscounted returns of the testing result.
        :param callback: the callback
@ -435,6 +440,7 @@ class _BuilderMixinActorFactory(ActorFutureProviderProtocol):
    def with_actor_factory(self, actor_factory: ActorFactory) -> Self:
        """Allows to customize the actor component via the specification of a factory.
        If this function is not called, a default actor factory (with default parameters) will be used.
        :param actor_factory: the factory to use for the creation of the actor network
@ -450,7 +456,9 @@ class _BuilderMixinActorFactory(ActorFutureProviderProtocol):
        continuous_unbounded: bool = False,
        continuous_conditioned_sigma: bool = False,
    ) -> Self:
-        """:param hidden_sizes: the sequence of hidden dimensions to use in the network structure
+        """Adds a default actor factory with the given parameters.
        :param hidden_sizes: the sequence of hidden dimensions to use in the network structure
        :param continuous_unbounded: whether, for continuous action spaces, to apply tanh activation on final logits
        :param continuous_conditioned_sigma: whether, for continuous action spaces, the standard deviation of continuous actions (sigma)
            shall be computed from the input; if False, sigma is an independent parameter.
@ -479,9 +487,7 @@ class _BuilderMixinActorFactory(ActorFutureProviderProtocol):
 class _BuilderMixinActorFactory_ContinuousGaussian(_BuilderMixinActorFactory):
-    """Specialization of the actor mixin where, in the continuous case, the actor component outputs
+    """Specialization of the actor mixin where, in the continuous case, the actor component outputs Gaussian distribution parameters."""
    Gaussian distribution parameters.
    """
    def __init__(self) -> None:
        super().__init__(ContinuousActorType.GAUSSIAN)
@ -494,6 +500,7 @@ class _BuilderMixinActorFactory_ContinuousGaussian(_BuilderMixinActorFactory):
        continuous_conditioned_sigma: bool = False,
    ) -> Self:
        """Defines use of the default actor factory, allowing its parameters it to be customized.
        The default actor factory uses an MLP-style architecture.
        :param hidden_sizes: dimensions of hidden layers used by the network
@ -523,6 +530,7 @@ class _BuilderMixinActorFactory_ContinuousDeterministic(_BuilderMixinActorFactor
        hidden_activation: ModuleType = torch.nn.ReLU,
    ) -> Self:
        """Defines use of the default actor factory, allowing its parameters it to be customized.
        The default actor factory uses an MLP-style architecture.
        :param hidden_sizes: dimensions of hidden layers used by the network
@ -700,6 +708,7 @@ class _BuilderMixinCriticEnsembleFactory:
    def with_critic_ensemble_factory(self, factory: CriticEnsembleFactory) -> Self:
        """Specifies that the given factory shall be used for the critic ensemble.
        If unspecified, the default factory (:class:`CriticEnsembleFactoryDefault`) is used.
        :param factory: the critic ensemble factory
--- a/tianshou/highlevel/logger.py
+++ b/tianshou/highlevel/logger.py
@ -19,7 +19,9 @@ class LoggerFactory(ToStringMixin, ABC):
        run_id: str | None,
        config_dict: dict,
    ) -> TLogger:
-        """:param log_dir: path to the directory in which log data is to be stored
+        """Creates the logger.
        :param log_dir: path to the directory in which log data is to be stored
        :param experiment_name: the name of the job, which may contain `os.path.sep`
        :param run_id: a unique name, which, depending on the logging framework, may be used to identify the logger
        :param config_dict: a dictionary with data that is to be logged
--- a/tianshou/highlevel/module/actor.py
+++ b/tianshou/highlevel/module/actor.py
@ -168,7 +168,9 @@ class ActorFactoryContinuousGaussianNet(ActorFactoryContinuous):
        conditioned_sigma: bool = False,
        activation: ModuleType = nn.ReLU,
    ):
-        """:param hidden_sizes: the sequence of hidden dimensions to use in the network structure
+        """For actors with Gaussian policies.
        :param hidden_sizes: the sequence of hidden dimensions to use in the network structure
        :param unbounded: whether to apply tanh activation on final logits
        :param conditioned_sigma: if True, the standard deviation of continuous actions (sigma) is computed from the
            input; if False, sigma is an independent parameter
@ -229,9 +231,7 @@ class ActorFactoryDiscreteNet(ActorFactory):
 class ActorFactoryTransientStorageDecorator(ActorFactory):
-    """Wraps an actor factory, storing the most recently created actor instance such that it
+    """Wraps an actor factory, storing the most recently created actor instance such that it can be retrieved."""
    can be retrieved.
    """
    def __init__(self, actor_factory: ActorFactory, actor_future: ActorFuture):
        self.actor_factory = actor_factory
--- a/tianshou/highlevel/optim.py
+++ b/tianshou/highlevel/optim.py
@ -20,7 +20,9 @@ class OptimizerFactory(ABC, ToStringMixin):
 class OptimizerFactoryTorch(OptimizerFactory):
    def __init__(self, optim_class: OptimizerWithLearningRateProtocol, **kwargs: Any):
-        """:param optim_class: the optimizer class (e.g. subclass of `torch.optim.Optimizer`),
+        """Factory for torch optimizers.
        :param optim_class: the optimizer class (e.g. subclass of `torch.optim.Optimizer`),
            which will be passed the module parameters, the learning rate as `lr` and the
            kwargs provided.
        :param kwargs: keyword arguments to provide at optimizer construction
--- a/tianshou/highlevel/params/noise.py
+++ b/tianshou/highlevel/params/noise.py
@ -12,13 +12,12 @@ class NoiseFactory(ToStringMixin, ABC):
 class NoiseFactoryMaxActionScaledGaussian(NoiseFactory):
    """Factory for Gaussian noise where the standard deviation is a fraction of the maximum action value.
    This factory can only be applied to continuous action spaces.
    """
    def __init__(self, std_fraction: float):
-        """:param std_fraction: fraction (between 0 and 1) of the maximum action value that shall
+        """Factory for Gaussian noise where the standard deviation is a fraction of the maximum action value.
        This factory can only be applied to continuous action spaces.
        :param std_fraction: fraction (between 0 and 1) of the maximum action value that shall
        be used as the standard deviation
        """
        self.std_fraction = std_fraction
--- a/tianshou/highlevel/params/policy_params.py
+++ b/tianshou/highlevel/params/policy_params.py
@ -43,7 +43,9 @@ class ParamTransformerData:
 class ParamTransformer(ABC):
-    """Transforms one or more parameters from the representation used by the high-level API
+    """Base class for parameter transformations from high to low-level API.
    Transforms one or more parameters from the representation used by the high-level API
    to the representation required by the (low-level) policy implementation.
    It operates directly on a dictionary of keyword arguments, which is initially
    generated from the parameter dataclass (subclass of `Params`).
@ -83,7 +85,9 @@ class ParamTransformerChangeValue(ParamTransformer):
 class ParamTransformerLRScheduler(ParamTransformer):
-    """Transforms a key containing a learning rate scheduler factory (removed) into a key containing
+    """Transformer for learning rate scheduler params.
    Transforms a key containing a learning rate scheduler factory (removed) into a key containing
    a learning rate scheduler (added) for the data member `optim`.
    """
@ -100,12 +104,12 @@ class ParamTransformerLRScheduler(ParamTransformer):
 class ParamTransformerMultiLRScheduler(ParamTransformer):
    """Transforms several scheduler factories into a single scheduler, which may be a MultipleLRSchedulers instance
    if more than one factory is indeed given.
    """
    def __init__(self, optim_key_list: list[tuple[torch.optim.Optimizer, str]], key_scheduler: str):
-        """:param optim_key_list: a list of tuples (optimizer, key of learning rate factory)
+        """Transforms several scheduler factories into a single scheduler.
         The result may be a `MultipleLRSchedulers` instance if more than one factory is indeed given.
        :param optim_key_list: a list of tuples (optimizer, key of learning rate factory)
        :param key_scheduler: the key under which to store the resulting learning rate scheduler
        """
        self.optim_key_list = optim_key_list
--- a/tianshou/highlevel/persistence.py
+++ b/tianshou/highlevel/persistence.py
@ -57,9 +57,9 @@ class PersistenceGroup(Persistence):
 class PolicyPersistence:
    """Handles persistence of the policy."""
    class Mode(Enum):
        """Mode of persistence."""
        POLICY_STATE_DICT = "policy_state_dict"
        """Persist only the policy's state dictionary. Note that for a policy to be restored from
        such a dictionary, it is necessary to first create a structurally equivalent object which can
@ -81,7 +81,9 @@ class PolicyPersistence:
        enabled: bool = True,
        mode: Mode = Mode.POLICY,
    ):
-        """:param additional_persistence: a persistence instance which is to be invoked whenever
+        """Handles persistence of the policy.
        :param additional_persistence: a persistence instance which is to be invoked whenever
            this object is used to persist/restore data
        :param enabled: whether persistence is enabled (restoration is always enabled)
        :param mode: the persistence mode
--- a/tianshou/highlevel/trainer.py
+++ b/tianshou/highlevel/trainer.py
@ -51,7 +51,9 @@ class TrainerStopCallback(ToStringMixin, ABC):
    @abstractmethod
    def should_stop(self, mean_rewards: float, context: TrainingContext) -> bool:
-        """:param mean_rewards: the average undiscounted returns of the testing result
+        """Determines whether training should stop.
        :param mean_rewards: the average undiscounted returns of the testing result
        :param context: the training context
        :return: True if the goal has been reached and training should stop, False otherwise
        """
--- a/tianshou/policy/base.py
+++ b/tianshou/policy/base.py
@ -159,8 +159,7 @@ class BasePolicy(ABC, nn.Module):
        info: dict[str, Any] | None = None,
        state: dict | BatchProtocol | np.ndarray | None = None,
    ) -> np.ndarray | int:
-        """Get action as int (for discrete env's) or array (for continuous ones) from
+        """Get action as int (for discrete env's) or array (for continuous ones) from an env's observation and info.
        an env's observation and info.
        :param obs: observation from the gym's env.
        :param info: information given by the gym's env.
--- a/tianshou/utils/string.py
+++ b/tianshou/utils/string.py
@ -16,6 +16,8 @@ reCommaWhitespacePotentiallyBreaks = re.compile(r",\s+")
 log = logging.getLogger(__name__)
 # ruff: noqa
 class StringConverter(ABC):
    """Abstraction for a string conversion mechanism."""