diff --git a/examples/mujoco/config/logger.yml b/examples/mujoco/config/logger.yml deleted file mode 100644 index 16fe055..0000000 --- a/examples/mujoco/config/logger.yml +++ /dev/null @@ -1,5 +0,0 @@ -# Default logger config, keep in sync with LoggerConfig dataclass - -logger: tensorboard -logdir: log -wandb_project: mujoco.benchmark diff --git a/examples/mujoco/config/sampling.yml b/examples/mujoco/config/sampling.yml deleted file mode 100644 index 87ee291..0000000 --- a/examples/mujoco/config/sampling.yml +++ /dev/null @@ -1,10 +0,0 @@ -# Default config for sampling, epochs, parallelization, buffers, collectors, and batching. -# Keep in sync with RLSamplingConfig dataclass. -epoch: 100 -step_per_epoch: 30000 -batch_size: 64 -training_num: 64 -test_num: 10 -buffer_size: 4096 -step_per_collect: 2048 -repeat_per_collect: 10 diff --git a/examples/mujoco/default_config.yml b/examples/mujoco/default_config.yml deleted file mode 100644 index 6fdb01e..0000000 --- a/examples/mujoco/default_config.yml +++ /dev/null @@ -1,45 +0,0 @@ -# General config -logger: "tensorboard" -wandb_project: "mujoco.benchmark" -seed: 24 -logdir: "log" -device: "cpu" -watch: false -render: 0.0 -resume_path: null -resume_id: null - -# Training: NN -lr: 3e-4 -hidden_sizes: [64, 64] -lr_decay: true - -# Training: sampling -training_num: 64 -test_num: 10 -repeat_per_collect: 10 -batch_size: 64 -epoch: 100 -step_per_epoch: 30000 -step_per_collect: 2048 -buffer_size: 4096 - -# Training: RL modelling -gamma: 0.99 -rew_norm: true -dual_clip: null -value_clip: false -norm_adv: false -recompute_adv: true -gae_lambda: 0.95 - -# Training: PPO specifics -ent_coef: 0.0 -vf_coef: 0.25 -bound_action_method: "clip" -max_grad_norm: 0.5 -eps_clip: 0.2 - - -# Mujoco -task: "Ant-v3"