update atari ppo slots (#529)
@@ -102,10 +102,10 @@ One epoch here is equal to 100,000 env steps; 100 epochs correspond to 10M steps.
|
||||
|
||||
| task | best reward | reward curve | parameters |
|
||||
| --------------------------- | ----------- | ------------------------------------- | ------------------------------------------------------------ |
|
||||
| PongNoFrameskip-v4 | 20 |  | `python3 atari_ppo.py --task "PongNoFrameskip-v4"` |
|
||||
| BreakoutNoFrameskip-v4 | 442.1 |  | `python3 atari_ppo.py --task "BreakoutNoFrameskip-v4"` |
|
||||
| EnduroNoFrameskip-v4 | 1386.4 |  | `python3 atari_ppo.py --task "EnduroNoFrameskip-v4"` |
|
||||
| QbertNoFrameskip-v4 | 19585 |  | `python3 atari_ppo.py --task "QbertNoFrameskip-v4"` |
|
||||
| MsPacmanNoFrameskip-v4 | 2319 |  | `python3 atari_ppo.py --task "MsPacmanNoFrameskip-v4"` |
|
||||
| SeaquestNoFrameskip-v4 | 1764 |  | `python3 atari_ppo.py --task "SeaquestNoFrameskip-v4"` |
|
||||
| SpaceInvadersNoFrameskip-v4 | 1184 |  | `python3 atari_ppo.py --task "SpaceInvadersNoFrameskip-v4"` |
|
||||
| PongNoFrameskip-v4 | 20.1 |  | `python3 atari_ppo.py --task "PongNoFrameskip-v4"` |
|
||||
| BreakoutNoFrameskip-v4 | 438.5 |  | `python3 atari_ppo.py --task "BreakoutNoFrameskip-v4"` |
|
||||
| EnduroNoFrameskip-v4 | 1304.8 |  | `python3 atari_ppo.py --task "EnduroNoFrameskip-v4"` |
|
||||
| QbertNoFrameskip-v4 | 13640 |  | `python3 atari_ppo.py --task "QbertNoFrameskip-v4"` |
|
||||
| MsPacmanNoFrameskip-v4 | 1930 |  | `python3 atari_ppo.py --task "MsPacmanNoFrameskip-v4"` |
|
||||
| SeaquestNoFrameskip-v4 | 904 |  | `python3 atari_ppo.py --task "SeaquestNoFrameskip-v4" --lr 2.5e-5` |
|
||||
| SpaceInvadersNoFrameskip-v4 | 843 |  | `python3 atari_ppo.py --task "SpaceInvadersNoFrameskip-v4"` |
|
||||
|
@@ -24,7 +24,7 @@ def get_args():
|
||||
parser.add_argument('--seed', type=int, default=4213)
|
||||
parser.add_argument('--scale-obs', type=int, default=0)
|
||||
parser.add_argument('--buffer-size', type=int, default=100000)
|
||||
parser.add_argument('--lr', type=float, default=1e-4)
|
||||
parser.add_argument('--lr', type=float, default=5e-5)
|
||||
parser.add_argument('--gamma', type=float, default=0.99)
|
||||
parser.add_argument('--epoch', type=int, default=100)
|
||||
parser.add_argument('--step-per-epoch', type=int, default=100000)
|
||||
|
Before Width: | Height: | Size: 142 KiB After Width: | Height: | Size: 142 KiB |
Before Width: | Height: | Size: 144 KiB After Width: | Height: | Size: 146 KiB |
Before Width: | Height: | Size: 162 KiB After Width: | Height: | Size: 152 KiB |
Before Width: | Height: | Size: 119 KiB After Width: | Height: | Size: 115 KiB |
Before Width: | Height: | Size: 146 KiB After Width: | Height: | Size: 145 KiB |
Before Width: | Height: | Size: 136 KiB After Width: | Height: | Size: 137 KiB |
Before Width: | Height: | Size: 159 KiB After Width: | Height: | Size: 159 KiB |