From 7fa588309b035601dde0dfe14bad6e4dd77a7678 Mon Sep 17 00:00:00 2001 From: Dominik Jain Date: Wed, 10 Jan 2024 15:39:53 +0100 Subject: [PATCH] Update MuJoCo examples to use Ant-v4 instead of Ant-v3 --- examples/mujoco/mujoco_a2c.py | 2 +- examples/mujoco/mujoco_ddpg.py | 2 +- examples/mujoco/mujoco_ddpg_hl.py | 2 +- examples/mujoco/mujoco_npg.py | 2 +- examples/mujoco/mujoco_npg_hl.py | 2 +- examples/mujoco/mujoco_ppo.py | 2 +- examples/mujoco/mujoco_redq.py | 2 +- examples/mujoco/mujoco_reinforce.py | 2 +- examples/mujoco/mujoco_reinforce_hl.py | 2 +- examples/mujoco/mujoco_sac.py | 2 +- examples/mujoco/mujoco_td3.py | 2 +- examples/mujoco/mujoco_trpo.py | 2 +- examples/mujoco/mujoco_trpo_hl.py | 2 +- 13 files changed, 13 insertions(+), 13 deletions(-) diff --git a/examples/mujoco/mujoco_a2c.py b/examples/mujoco/mujoco_a2c.py index b58c802..7abd620 100755 --- a/examples/mujoco/mujoco_a2c.py +++ b/examples/mujoco/mujoco_a2c.py @@ -23,7 +23,7 @@ from tianshou.utils.net.continuous import ActorProb, Critic def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=4096) parser.add_argument("--hidden-sizes", type=int, nargs="*", default=[64, 64]) diff --git a/examples/mujoco/mujoco_ddpg.py b/examples/mujoco/mujoco_ddpg.py index 7594867..7cb9132 100755 --- a/examples/mujoco/mujoco_ddpg.py +++ b/examples/mujoco/mujoco_ddpg.py @@ -21,7 +21,7 @@ from tianshou.utils.net.continuous import Actor, Critic def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=1000000) parser.add_argument("--hidden-sizes", type=int, nargs="*", default=[256, 256]) diff --git a/examples/mujoco/mujoco_ddpg_hl.py b/examples/mujoco/mujoco_ddpg_hl.py index 3e3fc7a..40a3136 100644 --- a/examples/mujoco/mujoco_ddpg_hl.py +++ b/examples/mujoco/mujoco_ddpg_hl.py @@ -17,7 +17,7 @@ from tianshou.utils.logging import datetime_tag def main( experiment_config: ExperimentConfig, - task: str = "Ant-v3", + task: str = "Ant-v4", buffer_size: int = 1000000, hidden_sizes: Sequence[int] = (256, 256), actor_lr: float = 1e-3, diff --git a/examples/mujoco/mujoco_npg.py b/examples/mujoco/mujoco_npg.py index 6b1e8c1..f6b951b 100755 --- a/examples/mujoco/mujoco_npg.py +++ b/examples/mujoco/mujoco_npg.py @@ -23,7 +23,7 @@ from tianshou.utils.net.continuous import ActorProb, Critic def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=4096) parser.add_argument( diff --git a/examples/mujoco/mujoco_npg_hl.py b/examples/mujoco/mujoco_npg_hl.py index a423768..6784108 100644 --- a/examples/mujoco/mujoco_npg_hl.py +++ b/examples/mujoco/mujoco_npg_hl.py @@ -23,7 +23,7 @@ from tianshou.utils.logging import datetime_tag def main( experiment_config: ExperimentConfig, - task: str = "Ant-v3", + task: str = "Ant-v4", buffer_size: int = 4096, hidden_sizes: Sequence[int] = (64, 64), lr: float = 1e-3, diff --git a/examples/mujoco/mujoco_ppo.py b/examples/mujoco/mujoco_ppo.py index e7287f5..40b2f39 100755 --- a/examples/mujoco/mujoco_ppo.py +++ b/examples/mujoco/mujoco_ppo.py @@ -23,7 +23,7 @@ from tianshou.utils.net.continuous import ActorProb, Critic def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=4096) parser.add_argument("--hidden-sizes", type=int, nargs="*", default=[64, 64]) diff --git a/examples/mujoco/mujoco_redq.py b/examples/mujoco/mujoco_redq.py index e39c7b0..b50304f 100755 --- a/examples/mujoco/mujoco_redq.py +++ b/examples/mujoco/mujoco_redq.py @@ -20,7 +20,7 @@ from tianshou.utils.net.continuous import ActorProb, Critic def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=1000000) parser.add_argument("--hidden-sizes", type=int, nargs="*", default=[256, 256]) diff --git a/examples/mujoco/mujoco_reinforce.py b/examples/mujoco/mujoco_reinforce.py index 1b39418..be0eb04 100755 --- a/examples/mujoco/mujoco_reinforce.py +++ b/examples/mujoco/mujoco_reinforce.py @@ -23,7 +23,7 @@ from tianshou.utils.net.continuous import ActorProb def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=4096) parser.add_argument("--hidden-sizes", type=int, nargs="*", default=[64, 64]) diff --git a/examples/mujoco/mujoco_reinforce_hl.py b/examples/mujoco/mujoco_reinforce_hl.py index 4f9bfdc..a524b0e 100644 --- a/examples/mujoco/mujoco_reinforce_hl.py +++ b/examples/mujoco/mujoco_reinforce_hl.py @@ -20,7 +20,7 @@ from tianshou.utils.logging import datetime_tag def main( experiment_config: ExperimentConfig, - task: str = "Ant-v3", + task: str = "Ant-v4", buffer_size: int = 4096, hidden_sizes: Sequence[int] = (64, 64), lr: float = 1e-3, diff --git a/examples/mujoco/mujoco_sac.py b/examples/mujoco/mujoco_sac.py index a53c04c..286f2cc 100755 --- a/examples/mujoco/mujoco_sac.py +++ b/examples/mujoco/mujoco_sac.py @@ -20,7 +20,7 @@ from tianshou.utils.net.continuous import ActorProb, Critic def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=1000000) parser.add_argument("--hidden-sizes", type=int, nargs="*", default=[256, 256]) diff --git a/examples/mujoco/mujoco_td3.py b/examples/mujoco/mujoco_td3.py index 8e94761..ef98616 100755 --- a/examples/mujoco/mujoco_td3.py +++ b/examples/mujoco/mujoco_td3.py @@ -21,7 +21,7 @@ from tianshou.utils.net.continuous import Actor, Critic def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=1000000) parser.add_argument("--hidden-sizes", type=int, nargs="*", default=[256, 256]) diff --git a/examples/mujoco/mujoco_trpo.py b/examples/mujoco/mujoco_trpo.py index 97fc0f9..d38afdb 100755 --- a/examples/mujoco/mujoco_trpo.py +++ b/examples/mujoco/mujoco_trpo.py @@ -23,7 +23,7 @@ from tianshou.utils.net.continuous import ActorProb, Critic def get_args(): parser = argparse.ArgumentParser() - parser.add_argument("--task", type=str, default="Ant-v3") + parser.add_argument("--task", type=str, default="Ant-v4") parser.add_argument("--seed", type=int, default=0) parser.add_argument("--buffer-size", type=int, default=4096) parser.add_argument( diff --git a/examples/mujoco/mujoco_trpo_hl.py b/examples/mujoco/mujoco_trpo_hl.py index 692e302..855caec 100644 --- a/examples/mujoco/mujoco_trpo_hl.py +++ b/examples/mujoco/mujoco_trpo_hl.py @@ -23,7 +23,7 @@ from tianshou.utils.logging import datetime_tag def main( experiment_config: ExperimentConfig, - task: str = "Ant-v3", + task: str = "Ant-v4", buffer_size: int = 4096, hidden_sizes: Sequence[int] = (64, 64), lr: float = 1e-3,