diff --git a/examples/atari/README.md b/examples/atari/README.md index 47c50d3..971231b 100644 --- a/examples/atari/README.md +++ b/examples/atari/README.md @@ -60,13 +60,13 @@ One epoch here is equal to 100,000 env step, 100 epochs stand for 10M. | task | best reward | reward curve | parameters | | --------------------------- | ----------- | ------------------------------------- | ------------------------------------------------------------ | -| PongNoFrameskip-v4 | 20.9 | ![](results/iqn/Pong_rew.png) | `python3 atari_iqn.py --task "PongNoFrameskip-v4" --batch-size 64` | -| BreakoutNoFrameskip-v4 | 578.3 | ![](results/iqn/Breakout_rew.png) | `python3 atari_iqn.py --task "BreakoutNoFrameskip-v4" --n-step 1` | -| EnduroNoFrameskip-v4 | 1507 | ![](results/iqn/Enduro_rew.png) | `python3 atari_iqn.py --task "EnduroNoFrameskip-v4"` | -| QbertNoFrameskip-v4 | 15520 | ![](results/iqn/Qbert_rew.png) | `python3 atari_iqn.py --task "QbertNoFrameskip-v4"` | -| MsPacmanNoFrameskip-v4 | 2911 | ![](results/iqn/MsPacman_rew.png) | `python3 atari_iqn.py --task "MsPacmanNoFrameskip-v4"` | -| SeaquestNoFrameskip-v4 | 6236 | ![](results/iqn/Seaquest_rew.png) | `python3 atari_iqn.py --task "SeaquestNoFrameskip-v4"` | -| SpaceInvadersNoFrameskip-v4 | 1370 | ![](results/iqn/SpaceInvader_rew.png) | `python3 atari_iqn.py --task "SpaceInvadersNoFrameskip-v4"` | +| PongNoFrameskip-v4 | 20.3 | ![](results/iqn/Pong_rew.png) | `python3 atari_iqn.py --task "PongNoFrameskip-v4" --batch-size 64` | +| BreakoutNoFrameskip-v4 | 496.7 | ![](results/iqn/Breakout_rew.png) | `python3 atari_iqn.py --task "BreakoutNoFrameskip-v4" --n-step 1` | +| EnduroNoFrameskip-v4 | 1545 | ![](results/iqn/Enduro_rew.png) | `python3 atari_iqn.py --task "EnduroNoFrameskip-v4"` | +| QbertNoFrameskip-v4 | 15342.5 | ![](results/iqn/Qbert_rew.png) | `python3 atari_iqn.py --task "QbertNoFrameskip-v4"` | +| MsPacmanNoFrameskip-v4 | 2915 | ![](results/iqn/MsPacman_rew.png) | `python3 atari_iqn.py --task "MsPacmanNoFrameskip-v4"` | +| SeaquestNoFrameskip-v4 | 4874 | ![](results/iqn/Seaquest_rew.png) | `python3 atari_iqn.py --task "SeaquestNoFrameskip-v4"` | +| SpaceInvadersNoFrameskip-v4 | 1498.5 | ![](results/iqn/SpaceInvaders_rew.png) | `python3 atari_iqn.py --task "SpaceInvadersNoFrameskip-v4"` | # BCQ diff --git a/examples/atari/results/iqn/Breakout_rew.png b/examples/atari/results/iqn/Breakout_rew.png index d486bf6..ab9b948 100644 Binary files a/examples/atari/results/iqn/Breakout_rew.png and b/examples/atari/results/iqn/Breakout_rew.png differ diff --git a/examples/atari/results/iqn/Enduro_rew.png b/examples/atari/results/iqn/Enduro_rew.png index 6d0a8a0..2b91299 100644 Binary files a/examples/atari/results/iqn/Enduro_rew.png and b/examples/atari/results/iqn/Enduro_rew.png differ diff --git a/examples/atari/results/iqn/MsPacman_rew.png b/examples/atari/results/iqn/MsPacman_rew.png index da9bcba..af6f3ae 100644 Binary files a/examples/atari/results/iqn/MsPacman_rew.png and b/examples/atari/results/iqn/MsPacman_rew.png differ diff --git a/examples/atari/results/iqn/Pong_rew.png b/examples/atari/results/iqn/Pong_rew.png index d5c91bd..bb8d31f 100644 Binary files a/examples/atari/results/iqn/Pong_rew.png and b/examples/atari/results/iqn/Pong_rew.png differ diff --git a/examples/atari/results/iqn/Qbert_rew.png b/examples/atari/results/iqn/Qbert_rew.png index 749e818..085a64d 100644 Binary files a/examples/atari/results/iqn/Qbert_rew.png and b/examples/atari/results/iqn/Qbert_rew.png differ diff --git a/examples/atari/results/iqn/Seaquest_rew.png b/examples/atari/results/iqn/Seaquest_rew.png index 0b14469..8f343cd 100644 Binary files a/examples/atari/results/iqn/Seaquest_rew.png and b/examples/atari/results/iqn/Seaquest_rew.png differ diff --git a/examples/atari/results/iqn/SpaceInvaders_rew.png b/examples/atari/results/iqn/SpaceInvaders_rew.png index 39b67dd..d8e7b33 100644 Binary files a/examples/atari/results/iqn/SpaceInvaders_rew.png and b/examples/atari/results/iqn/SpaceInvaders_rew.png differ