* Created mixins for agent factories to reduce code duplication
* Further factorised params & mixins for experiment factories
* Additional parameter abstractions
* Implement high-level MuJoCo TD3 example
20 lines
527 B
Python
20 lines
527 B
Python
from dataclasses import dataclass
|
|
|
|
|
|
@dataclass
class RLSamplingConfig:
    """Sampling, epochs, parallelization, buffers, collectors, and batching.

    A plain settings container: every field has a default, so the class can
    be instantiated without arguments and individual values overridden by
    keyword. No validation is performed on construction.

    NOTE(review): the per-field notes below are inferred from the field
    names only; confirm them against the code that consumes this config.
    """

    # TODO: What are reasonable defaults?

    # --- training schedule (presumably epochs x environment steps) ---
    num_epochs: int = 100
    step_per_epoch: int = 30000

    # --- batching ---
    batch_size: int = 64

    # --- parallelization (presumably counts of parallel environments) ---
    num_train_envs: int = 64
    num_test_envs: int = 10

    # --- buffer / collection ---
    buffer_size: int = 4096
    step_per_collect: int = 2048
    repeat_per_collect: int = 10
    update_per_step: int = 1

    # --- warm-up before training (semantics not visible here; TODO confirm) ---
    start_timesteps: int = 0
    start_timesteps_random: bool = False
|