[{"env_step": 0, "rew": 5.89, "rew_std": 1.2613, "Agent": "PPO"}, {"env_step": 30720, "rew": 991.92, "rew_std": 18.7133, "Agent": "PPO"}, {"env_step": 61440, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 92160, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 122880, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 153600, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 184320, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 215040, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 245760, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 276480, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 307200, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 337920, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 368640, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 399360, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 430080, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 460800, "rew": 894.23, "rew_std": 282.0792, "Agent": "PPO"}, {"env_step": 491520, "rew": 909.04, "rew_std": 184.7011, "Agent": "PPO"}, {"env_step": 522240, "rew": 953.76, "rew_std": 138.72, "Agent": "PPO"}, {"env_step": 552960, "rew": 963.62, "rew_std": 109.14, "Agent": "PPO"}, {"env_step": 583680, "rew": 979.64, "rew_std": 61.08, "Agent": "PPO"}, {"env_step": 614400, "rew": 1000.0, "rew_std": 0.0, "Agent": "PPO"}, {"env_step": 645120, "rew": 983.94, "rew_std": 48.18, "Agent": "PPO"}, {"env_step": 675840, "rew": 957.85, "rew_std": 126.45, "Agent": "PPO"}, {"env_step": 706560, "rew": 921.94, "rew_std": 234.18, "Agent": "PPO"}, {"env_step": 737280, "rew": 913.44, "rew_std": 259.68, "Agent": "PPO"}, {"env_step": 768000, "rew": 917.6, "rew_std": 247.2, "Agent": "PPO"}, {"env_step": 798720, "rew": 921.5, "rew_std": 235.5, "Agent": "PPO"}, {"env_step": 829440, "rew": 921.61, "rew_std": 235.17, "Agent": "PPO"}, {"env_step": 860160, "rew": 874.86, "rew_std": 263.0724, "Agent": "PPO"}, {"env_step": 890880, "rew": 862.17, "rew_std": 248.3223, "Agent": "PPO"}, {"env_step": 921600, "rew": 751.64, "rew_std": 379.4485, "Agent": "PPO"}, {"env_step": 952320, "rew": 817.05, "rew_std": 326.3875, "Agent": "PPO"}, {"env_step": 983040, "rew": 824.11, "rew_std": 312.4759, "Agent": "PPO"}, {"env_step": 1013760, "rew": 791.61, "rew_std": 342.7439, "Agent": "PPO"}, {"env_step": 1044480, "rew": 814.11, "rew_std": 316.6064, "Agent": "PPO"}, {"env_step": 1075200, "rew": 732.38, "rew_std": 397.0806, "Agent": "PPO"}, {"env_step": 1105920, "rew": 735.99, "rew_std": 393.5189, "Agent": "PPO"}, {"env_step": 1136640, "rew": 756.65, "rew_std": 388.4296, "Agent": "PPO"}, {"env_step": 1167360, "rew": 648.53, "rew_std": 440.111, "Agent": "PPO"}, {"env_step": 1198080, "rew": 673.59, "rew_std": 434.882, "Agent": "PPO"}, {"env_step": 1228800, "rew": 663.75, "rew_std": 435.8427, "Agent": "PPO"}, {"env_step": 1259520, "rew": 663.65, "rew_std": 435.3639, "Agent": "PPO"}, {"env_step": 1290240, "rew": 597.03, "rew_std": 439.9041, "Agent": "PPO"}, {"env_step": 1320960, "rew": 666.76, "rew_std": 430.241, "Agent": "PPO"}, {"env_step": 1351680, "rew": 695.85, "rew_std": 435.7469, "Agent": "PPO"}, {"env_step": 1382400, "rew": 614.87, "rew_std": 450.4714, "Agent": "PPO"}, {"env_step": 1413120, "rew": 514.3, "rew_std": 449.8707, "Agent": "PPO"}, {"env_step": 1443840, "rew": 504.17, "rew_std": 438.6437, "Agent": "PPO"}, {"env_step": 1474560, "rew": 486.43, "rew_std": 432.2417, "Agent": "PPO"}, {"env_step": 1505280, "rew": 492.89, "rew_std": 431.6997, "Agent": "PPO"}, {"env_step": 1536000, "rew": 505.8, "rew_std": 448.4553, "Agent": "PPO"}, {"env_step": 1566720, "rew": 504.57, "rew_std": 464.0222, "Agent": "PPO"}, {"env_step": 1597440, "rew": 478.38, "rew_std": 443.5053, "Agent": "PPO"}, {"env_step": 1628160, "rew": 499.29, "rew_std": 438.305, "Agent": "PPO"}, {"env_step": 1658880, "rew": 594.1, "rew_std": 446.8878, "Agent": "PPO"}, {"env_step": 1689600, "rew": 679.69, "rew_std": 422.8528, "Agent": "PPO"}, {"env_step": 1720320, "rew": 675.65, "rew_std": 425.7626, "Agent": "PPO"}, {"env_step": 1751040, "rew": 678.18, "rew_std": 421.0652, "Agent": "PPO"}, {"env_step": 1781760, "rew": 716.62, "rew_std": 433.3988, "Agent": "PPO"}, {"env_step": 1812480, "rew": 715.64, "rew_std": 434.7247, "Agent": "PPO"}, {"env_step": 1843200, "rew": 700.41, "rew_std": 423.6157, "Agent": "PPO"}, {"env_step": 1873920, "rew": 673.37, "rew_std": 404.6755, "Agent": "PPO"}, {"env_step": 1904640, "rew": 705.65, "rew_std": 412.9842, "Agent": "PPO"}, {"env_step": 1935360, "rew": 686.0, "rew_std": 406.3371, "Agent": "PPO"}, {"env_step": 1966080, "rew": 721.63, "rew_std": 406.8133, "Agent": "PPO"}, {"env_step": 1996800, "rew": 743.19, "rew_std": 376.0792, "Agent": "PPO"}, {"env_step": 2027520, "rew": 811.83, "rew_std": 350.2001, "Agent": "PPO"}, {"env_step": 2058240, "rew": 823.86, "rew_std": 352.3771, "Agent": "PPO"}, {"env_step": 2088960, "rew": 822.57, "rew_std": 354.871, "Agent": "PPO"}, {"env_step": 2119680, "rew": 825.47, "rew_std": 349.1095, "Agent": "PPO"}, {"env_step": 2150400, "rew": 803.09, "rew_std": 338.447, "Agent": "PPO"}, {"env_step": 2181120, "rew": 827.57, "rew_std": 344.8652, "Agent": "PPO"}, {"env_step": 2211840, "rew": 835.49, "rew_std": 329.0274, "Agent": "PPO"}, {"env_step": 2242560, "rew": 840.62, "rew_std": 319.6467, "Agent": "PPO"}, {"env_step": 2273280, "rew": 837.3, "rew_std": 310.0583, "Agent": "PPO"}, {"env_step": 2304000, "rew": 849.49, "rew_std": 305.1477, "Agent": "PPO"}, {"env_step": 2334720, "rew": 869.85, "rew_std": 250.1218, "Agent": "PPO"}, {"env_step": 2365440, "rew": 917.12, "rew_std": 248.64, "Agent": "PPO"}, {"env_step": 2396160, "rew": 915.76, "rew_std": 252.72, "Agent": "PPO"}, {"env_step": 2426880, "rew": 917.29, "rew_std": 238.4911, "Agent": "PPO"}, {"env_step": 2457600, "rew": 845.93, "rew_std": 291.2987, "Agent": "PPO"}, {"env_step": 2488320, "rew": 855.03, "rew_std": 261.2282, "Agent": "PPO"}, {"env_step": 2519040, "rew": 900.61, "rew_std": 243.8298, "Agent": "PPO"}, {"env_step": 2549760, "rew": 900.54, "rew_std": 246.8906, "Agent": "PPO"}, {"env_step": 2580480, "rew": 909.48, "rew_std": 234.424, "Agent": "PPO"}, {"env_step": 2611200, "rew": 900.49, "rew_std": 243.7414, "Agent": "PPO"}, {"env_step": 2641920, "rew": 921.6, "rew_std": 235.2, "Agent": "PPO"}, {"env_step": 2672640, "rew": 905.18, "rew_std": 237.499, "Agent": "PPO"}, {"env_step": 2703360, "rew": 925.26, "rew_std": 224.22, "Agent": "PPO"}, {"env_step": 2734080, "rew": 912.07, "rew_std": 232.4689, "Agent": "PPO"}, {"env_step": 2764800, "rew": 924.37, "rew_std": 222.5248, "Agent": "PPO"}, {"env_step": 2795520, "rew": 909.44, "rew_std": 226.5858, "Agent": "PPO"}, {"env_step": 2826240, "rew": 924.46, "rew_std": 212.8309, "Agent": "PPO"}, {"env_step": 2856960, "rew": 905.68, "rew_std": 211.3978, "Agent": "PPO"}, {"env_step": 2887680, "rew": 928.55, "rew_std": 214.35, "Agent": "PPO"}, {"env_step": 2918400, "rew": 924.14, "rew_std": 210.3213, "Agent": "PPO"}, {"env_step": 2949120, "rew": 922.3, "rew_std": 202.7814, "Agent": "PPO"}, {"env_step": 2979840, "rew": 934.52, "rew_std": 152.1107, "Agent": "PPO"}, {"env_step": 3010560, "rew": 934.61, "rew_std": 190.3107, "Agent": "PPO"}, {"env_step": 3041280, "rew": 925.86, "rew_std": 193.2455, "Agent": "PPO"}, {"env_step": 3072000, "rew": 934.13, "rew_std": 167.4007, "Agent": "PPO"}, {"env_step": 5000, "rew": 57.22, "rew_std": 8.7888, "Agent": "TD3"}, {"env_step": 10000, "rew": 63.94, "rew_std": 15.7719, "Agent": "TD3"}, {"env_step": 15000, "rew": 58.57, "rew_std": 17.0332, "Agent": "TD3"}, {"env_step": 20000, "rew": 126.66, "rew_std": 76.2021, "Agent": "TD3"}, {"env_step": 25000, "rew": 616.43, "rew_std": 388.5243, "Agent": "TD3"}, {"env_step": 30000, "rew": 828.24, "rew_std": 343.5527, "Agent": "TD3"}, {"env_step": 35000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 40000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 45000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 50000, "rew": 933.47, "rew_std": 199.59, "Agent": "TD3"}, {"env_step": 55000, "rew": 976.87, "rew_std": 69.39, "Agent": "TD3"}, {"env_step": 60000, "rew": 809.04, "rew_std": 381.9246, "Agent": "TD3"}, {"env_step": 65000, "rew": 808.35, "rew_std": 383.3043, "Agent": "TD3"}, {"env_step": 70000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 75000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 80000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 85000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 90000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 95000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 100000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 105000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 110000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 115000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 120000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 125000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 130000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 135000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 140000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 145000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 150000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 155000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 160000, "rew": 903.53, "rew_std": 289.41, "Agent": "TD3"}, {"env_step": 165000, "rew": 904.12, "rew_std": 287.64, "Agent": "TD3"}, {"env_step": 170000, "rew": 904.97, "rew_std": 285.09, "Agent": "TD3"}, {"env_step": 175000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 180000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 185000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 190000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 195000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 200000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 205000, "rew": 903.88, "rew_std": 288.36, "Agent": "TD3"}, {"env_step": 210000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 215000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 220000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 225000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 230000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 235000, "rew": 981.89, "rew_std": 54.33, "Agent": "TD3"}, {"env_step": 240000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 245000, "rew": 955.73, "rew_std": 132.81, "Agent": "TD3"}, {"env_step": 250000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 255000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 260000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 265000, "rew": 919.42, "rew_std": 241.74, "Agent": "TD3"}, {"env_step": 270000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 275000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 280000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 285000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 290000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 295000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 300000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 305000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 310000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 315000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 320000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 325000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 330000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 335000, "rew": 995.98, "rew_std": 12.06, "Agent": "TD3"}, {"env_step": 340000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 345000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 350000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 355000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 360000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 365000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 370000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 375000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 380000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 385000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 390000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 395000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 400000, "rew": 987.18, "rew_std": 38.46, "Agent": "TD3"}, {"env_step": 405000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 410000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 415000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 420000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 425000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 430000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 435000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 440000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 445000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 450000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 455000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 460000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 465000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 470000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 475000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 480000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 485000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 490000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 495000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 500000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 505000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 510000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 515000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 520000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 525000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 530000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 535000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 540000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 545000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 550000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 555000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 560000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 565000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 570000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 575000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 580000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 585000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 590000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 595000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 600000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 605000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 610000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 615000, "rew": 912.84, "rew_std": 261.48, "Agent": "TD3"}, {"env_step": 620000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 625000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 630000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 635000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 640000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 645000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 650000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 655000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 660000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 665000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 670000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 675000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 680000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 685000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 690000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 695000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 700000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 705000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 710000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 715000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 720000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 725000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 730000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 735000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 740000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 745000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 750000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 755000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 760000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 765000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 770000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 775000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 780000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 785000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 790000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 795000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 800000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 805000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 810000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 815000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 820000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 825000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 830000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 835000, "rew": 967.62, "rew_std": 97.14, "Agent": "TD3"}, {"env_step": 840000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 845000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 850000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 855000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 860000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 865000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 870000, "rew": 960.62, "rew_std": 118.14, "Agent": "TD3"}, {"env_step": 875000, "rew": 903.47, "rew_std": 289.59, "Agent": "TD3"}, {"env_step": 880000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 885000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 890000, "rew": 953.41, "rew_std": 139.77, "Agent": "TD3"}, {"env_step": 895000, "rew": 916.7, "rew_std": 249.9, "Agent": "TD3"}, {"env_step": 900000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 905000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 910000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 915000, "rew": 992.77, "rew_std": 21.69, "Agent": "TD3"}, {"env_step": 920000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 925000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 930000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 935000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 940000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 945000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 950000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 955000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 960000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 965000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 970000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 975000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 980000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 985000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 990000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 995000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1000000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1005000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1010000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1015000, "rew": 927.09, "rew_std": 218.73, "Agent": "TD3"}, {"env_step": 1020000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1025000, "rew": 930.37, "rew_std": 208.89, "Agent": "TD3"}, {"env_step": 1030000, "rew": 930.54, "rew_std": 208.38, "Agent": "TD3"}, {"env_step": 1035000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1040000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1045000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1050000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1055000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1060000, "rew": 980.63, "rew_std": 58.11, "Agent": "TD3"}, {"env_step": 1065000, "rew": 971.03, "rew_std": 86.91, "Agent": "TD3"}, {"env_step": 1070000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1075000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1080000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1085000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1090000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1095000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1100000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1105000, "rew": 966.52, "rew_std": 73.5236, "Agent": "TD3"}, {"env_step": 1110000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1115000, "rew": 960.61, "rew_std": 118.17, "Agent": "TD3"}, {"env_step": 1120000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1125000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1130000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1135000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1140000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1145000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1150000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1155000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1160000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1165000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1170000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1175000, "rew": 913.93, "rew_std": 258.21, "Agent": "TD3"}, {"env_step": 1180000, "rew": 991.61, "rew_std": 25.17, "Agent": "TD3"}, {"env_step": 1185000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1190000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1195000, "rew": 906.07, "rew_std": 281.79, "Agent": "TD3"}, {"env_step": 1200000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1205000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1210000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1215000, "rew": 966.09, "rew_std": 101.73, "Agent": "TD3"}, {"env_step": 1220000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1225000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1230000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1235000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1240000, "rew": 1000.0, "rew_std": 0.0, "Agent": "TD3"}, {"env_step": 1245000, "rew": 909.42, "rew_std": 271.74, "Agent": "TD3"}, {"env_step": 1250000, "rew": 983.56, "rew_std": 49.32, "Agent": "TD3"}, {"env_step": 0, "rew": 6.38, "rew_std": 1.0167, "Agent": "REINFORCE"}, {"env_step": 30720, "rew": 12.69, "rew_std": 2.9851, "Agent": "REINFORCE"}, {"env_step": 61440, "rew": 32.23, "rew_std": 3.8879, "Agent": "REINFORCE"}, {"env_step": 92160, "rew": 77.27, "rew_std": 26.6147, "Agent": "REINFORCE"}, {"env_step": 122880, "rew": 148.32, "rew_std": 8.6668, "Agent": "REINFORCE"}, {"env_step": 153600, "rew": 204.35, "rew_std": 34.1581, "Agent": "REINFORCE"}, {"env_step": 184320, "rew": 241.57, "rew_std": 36.1153, "Agent": "REINFORCE"}, {"env_step": 215040, "rew": 269.84, "rew_std": 56.4856, "Agent": "REINFORCE"}, {"env_step": 245760, "rew": 292.24, "rew_std": 59.8266, "Agent": "REINFORCE"}, {"env_step": 276480, "rew": 303.53, "rew_std": 72.1803, "Agent": "REINFORCE"}, {"env_step": 307200, "rew": 366.6, "rew_std": 69.1684, "Agent": "REINFORCE"}, {"env_step": 337920, "rew": 418.87, "rew_std": 122.7315, "Agent": "REINFORCE"}, {"env_step": 368640, "rew": 540.22, "rew_std": 110.6541, "Agent": "REINFORCE"}, {"env_step": 399360, "rew": 584.33, "rew_std": 162.809, "Agent": "REINFORCE"}, {"env_step": 430080, "rew": 647.97, "rew_std": 202.2086, "Agent": "REINFORCE"}, {"env_step": 460800, "rew": 674.07, "rew_std": 184.473, "Agent": "REINFORCE"}, {"env_step": 491520, "rew": 698.35, "rew_std": 200.3386, "Agent": "REINFORCE"}, {"env_step": 522240, "rew": 708.29, "rew_std": 169.5527, "Agent": "REINFORCE"}, {"env_step": 552960, "rew": 719.61, "rew_std": 145.3608, "Agent": "REINFORCE"}, {"env_step": 583680, "rew": 736.16, "rew_std": 163.8339, "Agent": "REINFORCE"}, {"env_step": 614400, "rew": 712.89, "rew_std": 164.4856, "Agent": "REINFORCE"}, {"env_step": 645120, "rew": 758.01, "rew_std": 186.5025, "Agent": "REINFORCE"}, {"env_step": 675840, "rew": 783.12, "rew_std": 186.196, "Agent": "REINFORCE"}, {"env_step": 706560, "rew": 828.69, "rew_std": 182.6344, "Agent": "REINFORCE"}, {"env_step": 737280, "rew": 827.53, "rew_std": 195.6721, "Agent": "REINFORCE"}, {"env_step": 768000, "rew": 810.95, "rew_std": 190.6268, "Agent": "REINFORCE"}, {"env_step": 798720, "rew": 770.26, "rew_std": 172.4914, "Agent": "REINFORCE"}, {"env_step": 829440, "rew": 779.48, "rew_std": 122.8061, "Agent": "REINFORCE"}, {"env_step": 860160, "rew": 830.8, "rew_std": 146.0733, "Agent": "REINFORCE"}, {"env_step": 890880, "rew": 828.59, "rew_std": 142.9545, "Agent": "REINFORCE"}, {"env_step": 921600, "rew": 849.73, "rew_std": 96.7585, "Agent": "REINFORCE"}, {"env_step": 952320, "rew": 917.15, "rew_std": 90.8268, "Agent": "REINFORCE"}, {"env_step": 983040, "rew": 932.22, "rew_std": 76.1166, "Agent": "REINFORCE"}, {"env_step": 1013760, "rew": 879.17, "rew_std": 122.7968, "Agent": "REINFORCE"}, {"env_step": 1044480, "rew": 907.47, "rew_std": 111.0657, "Agent": "REINFORCE"}, {"env_step": 1075200, "rew": 944.47, "rew_std": 80.4061, "Agent": "REINFORCE"}, {"env_step": 1105920, "rew": 892.28, "rew_std": 127.6802, "Agent": "REINFORCE"}, {"env_step": 1136640, "rew": 861.91, "rew_std": 126.3386, "Agent": "REINFORCE"}, {"env_step": 1167360, "rew": 889.43, "rew_std": 143.7161, "Agent": "REINFORCE"}, {"env_step": 1198080, "rew": 904.98, "rew_std": 123.0215, "Agent": "REINFORCE"}, {"env_step": 1228800, "rew": 876.33, "rew_std": 171.302, "Agent": "REINFORCE"}, {"env_step": 1259520, "rew": 891.96, "rew_std": 193.7084, "Agent": "REINFORCE"}, {"env_step": 1290240, "rew": 878.39, "rew_std": 164.648, "Agent": "REINFORCE"}, {"env_step": 1320960, "rew": 861.3, "rew_std": 181.4943, "Agent": "REINFORCE"}, {"env_step": 1351680, "rew": 867.75, "rew_std": 170.6529, "Agent": "REINFORCE"}, {"env_step": 1382400, "rew": 845.37, "rew_std": 193.2622, "Agent": "REINFORCE"}, {"env_step": 1413120, "rew": 842.0, "rew_std": 193.8438, "Agent": "REINFORCE"}, {"env_step": 1443840, "rew": 820.57, "rew_std": 219.4767, "Agent": "REINFORCE"}, {"env_step": 1474560, "rew": 815.99, "rew_std": 236.7662, "Agent": "REINFORCE"}, {"env_step": 1505280, "rew": 814.27, "rew_std": 219.5517, "Agent": "REINFORCE"}, {"env_step": 1536000, "rew": 830.9, "rew_std": 232.4408, "Agent": "REINFORCE"}, {"env_step": 1566720, "rew": 827.87, "rew_std": 226.6782, "Agent": "REINFORCE"}, {"env_step": 1597440, "rew": 835.52, "rew_std": 211.3546, "Agent": "REINFORCE"}, {"env_step": 1628160, "rew": 875.83, "rew_std": 180.7828, "Agent": "REINFORCE"}, {"env_step": 1658880, "rew": 907.5, "rew_std": 145.8232, "Agent": "REINFORCE"}, {"env_step": 1689600, "rew": 918.3, "rew_std": 119.6084, "Agent": "REINFORCE"}, {"env_step": 1720320, "rew": 923.26, "rew_std": 124.8266, "Agent": "REINFORCE"}, {"env_step": 1751040, "rew": 916.52, "rew_std": 127.6408, "Agent": "REINFORCE"}, {"env_step": 1781760, "rew": 881.89, "rew_std": 168.3299, "Agent": "REINFORCE"}, {"env_step": 1812480, "rew": 854.64, "rew_std": 152.5227, "Agent": "REINFORCE"}, {"env_step": 1843200, "rew": 843.18, "rew_std": 147.2391, "Agent": "REINFORCE"}, {"env_step": 1873920, "rew": 830.27, "rew_std": 199.4989, "Agent": "REINFORCE"}, {"env_step": 1904640, "rew": 760.88, "rew_std": 235.9908, "Agent": "REINFORCE"}, {"env_step": 1935360, "rew": 752.09, "rew_std": 262.4417, "Agent": "REINFORCE"}, {"env_step": 1966080, "rew": 824.91, "rew_std": 257.6926, "Agent": "REINFORCE"}, {"env_step": 1996800, "rew": 827.51, "rew_std": 279.11, "Agent": "REINFORCE"}, {"env_step": 2027520, "rew": 830.03, "rew_std": 275.1672, "Agent": "REINFORCE"}, {"env_step": 2058240, "rew": 816.47, "rew_std": 282.6688, "Agent": "REINFORCE"}, {"env_step": 2088960, "rew": 860.69, "rew_std": 263.9615, "Agent": "REINFORCE"}, {"env_step": 2119680, "rew": 889.93, "rew_std": 165.5766, "Agent": "REINFORCE"}, {"env_step": 2150400, "rew": 914.43, "rew_std": 139.7138, "Agent": "REINFORCE"}, {"env_step": 2181120, "rew": 866.68, "rew_std": 178.7052, "Agent": "REINFORCE"}, {"env_step": 2211840, "rew": 877.44, "rew_std": 147.7871, "Agent": "REINFORCE"}, {"env_step": 2242560, "rew": 933.0, "rew_std": 124.4947, "Agent": "REINFORCE"}, {"env_step": 2273280, "rew": 907.14, "rew_std": 150.9342, "Agent": "REINFORCE"}, {"env_step": 2304000, "rew": 933.29, "rew_std": 198.7339, "Agent": "REINFORCE"}, {"env_step": 2334720, "rew": 926.73, "rew_std": 172.8165, "Agent": "REINFORCE"}, {"env_step": 2365440, "rew": 933.02, "rew_std": 180.0415, "Agent": "REINFORCE"}, {"env_step": 2396160, "rew": 927.41, "rew_std": 139.3859, "Agent": "REINFORCE"}, {"env_step": 2426880, "rew": 918.35, "rew_std": 143.5981, "Agent": "REINFORCE"}, {"env_step": 2457600, "rew": 930.83, "rew_std": 134.4429, "Agent": "REINFORCE"}, {"env_step": 2488320, "rew": 915.37, "rew_std": 192.8453, "Agent": "REINFORCE"}, {"env_step": 2519040, "rew": 888.03, "rew_std": 202.7, "Agent": "REINFORCE"}, {"env_step": 2549760, "rew": 858.34, "rew_std": 201.8235, "Agent": "REINFORCE"}, {"env_step": 2580480, "rew": 864.93, "rew_std": 204.9745, "Agent": "REINFORCE"}, {"env_step": 2611200, "rew": 858.65, "rew_std": 199.3346, "Agent": "REINFORCE"}, {"env_step": 2641920, "rew": 835.58, "rew_std": 190.5613, "Agent": "REINFORCE"}, {"env_step": 2672640, "rew": 877.95, "rew_std": 189.4195, "Agent": "REINFORCE"}, {"env_step": 2703360, "rew": 889.08, "rew_std": 136.7458, "Agent": "REINFORCE"}, {"env_step": 2734080, "rew": 875.81, "rew_std": 187.1033, "Agent": "REINFORCE"}, {"env_step": 2764800, "rew": 900.8, "rew_std": 185.6886, "Agent": "REINFORCE"}, {"env_step": 2795520, "rew": 976.84, "rew_std": 36.2903, "Agent": "REINFORCE"}, {"env_step": 2826240, "rew": 994.83, "rew_std": 14.6638, "Agent": "REINFORCE"}, {"env_step": 2856960, "rew": 982.4, "rew_std": 41.4874, "Agent": "REINFORCE"}, {"env_step": 2887680, "rew": 958.21, "rew_std": 104.2025, "Agent": "REINFORCE"}, {"env_step": 2918400, "rew": 965.74, "rew_std": 48.0941, "Agent": "REINFORCE"}, {"env_step": 2949120, "rew": 992.54, "rew_std": 15.5009, "Agent": "REINFORCE"}, {"env_step": 2979840, "rew": 999.21, "rew_std": 2.37, "Agent": "REINFORCE"}, {"env_step": 3010560, "rew": 995.32, "rew_std": 10.7451, "Agent": "REINFORCE"}, {"env_step": 3041280, "rew": 979.38, "rew_std": 42.6937, "Agent": "REINFORCE"}, {"env_step": 3072000, "rew": 964.1, "rew_std": 82.9313, "Agent": "REINFORCE"}, {"env_step": 3102720, "rew": 959.63, "rew_std": 106.8083, "Agent": "REINFORCE"}, {"env_step": 3133440, "rew": 956.85, "rew_std": 106.4687, "Agent": "REINFORCE"}, {"env_step": 3164160, "rew": 949.08, "rew_std": 126.2108, "Agent": "REINFORCE"}, {"env_step": 3194880, "rew": 959.78, "rew_std": 75.3591, "Agent": "REINFORCE"}, {"env_step": 3225600, "rew": 986.1, "rew_std": 31.7728, "Agent": "REINFORCE"}, {"env_step": 3256320, "rew": 970.11, "rew_std": 58.0504, "Agent": "REINFORCE"}, {"env_step": 3287040, "rew": 925.99, "rew_std": 169.4014, "Agent": "REINFORCE"}, {"env_step": 3317760, "rew": 937.4, "rew_std": 132.2121, "Agent": "REINFORCE"}, {"env_step": 3348480, "rew": 938.35, "rew_std": 111.87, "Agent": "REINFORCE"}, {"env_step": 3379200, "rew": 958.97, "rew_std": 76.2582, "Agent": "REINFORCE"}, {"env_step": 3409920, "rew": 973.93, "rew_std": 78.21, "Agent": "REINFORCE"}, {"env_step": 3440640, "rew": 993.26, "rew_std": 13.4807, "Agent": "REINFORCE"}, {"env_step": 3471360, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 3502080, "rew": 991.8, "rew_std": 24.6, "Agent": "REINFORCE"}, {"env_step": 3532800, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 3563520, "rew": 987.43, "rew_std": 37.71, "Agent": "REINFORCE"}, {"env_step": 3594240, "rew": 993.49, "rew_std": 15.1111, "Agent": "REINFORCE"}, {"env_step": 3624960, "rew": 952.32, "rew_std": 96.3679, "Agent": "REINFORCE"}, {"env_step": 3655680, "rew": 958.15, "rew_std": 86.4831, "Agent": "REINFORCE"}, {"env_step": 3686400, "rew": 996.88, "rew_std": 9.36, "Agent": "REINFORCE"}, {"env_step": 3717120, "rew": 985.05, "rew_std": 43.4356, "Agent": "REINFORCE"}, {"env_step": 3747840, "rew": 988.67, "rew_std": 19.47, "Agent": "REINFORCE"}, {"env_step": 3778560, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 3809280, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 3840000, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 3870720, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 3901440, "rew": 997.36, "rew_std": 7.92, "Agent": "REINFORCE"}, {"env_step": 3932160, "rew": 961.05, "rew_std": 89.4592, "Agent": "REINFORCE"}, {"env_step": 3962880, "rew": 996.96, "rew_std": 9.12, "Agent": "REINFORCE"}, {"env_step": 3993600, "rew": 989.29, "rew_std": 23.3794, "Agent": "REINFORCE"}, {"env_step": 4024320, "rew": 980.13, "rew_std": 44.6161, "Agent": "REINFORCE"}, {"env_step": 4055040, "rew": 936.52, "rew_std": 138.0583, "Agent": "REINFORCE"}, {"env_step": 4085760, "rew": 898.51, "rew_std": 209.1586, "Agent": "REINFORCE"}, {"env_step": 4116480, "rew": 924.11, "rew_std": 150.3964, "Agent": "REINFORCE"}, {"env_step": 4147200, "rew": 947.87, "rew_std": 120.5692, "Agent": "REINFORCE"}, {"env_step": 4177920, "rew": 985.73, "rew_std": 29.0117, "Agent": "REINFORCE"}, {"env_step": 4208640, "rew": 997.0, "rew_std": 9.0, "Agent": "REINFORCE"}, {"env_step": 4239360, "rew": 984.57, "rew_std": 46.29, "Agent": "REINFORCE"}, {"env_step": 4270080, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 4300800, "rew": 992.52, "rew_std": 22.44, "Agent": "REINFORCE"}, {"env_step": 4331520, "rew": 996.87, "rew_std": 9.3567, "Agent": "REINFORCE"}, {"env_step": 4362240, "rew": 971.22, "rew_std": 80.9581, "Agent": "REINFORCE"}, {"env_step": 4392960, "rew": 996.96, "rew_std": 6.8386, "Agent": "REINFORCE"}, {"env_step": 4423680, "rew": 984.05, "rew_std": 47.85, "Agent": "REINFORCE"}, {"env_step": 4454400, "rew": 969.73, "rew_std": 89.3859, "Agent": "REINFORCE"}, {"env_step": 4485120, "rew": 974.38, "rew_std": 51.5344, "Agent": "REINFORCE"}, {"env_step": 4515840, "rew": 980.65, "rew_std": 38.7903, "Agent": "REINFORCE"}, {"env_step": 4546560, "rew": 994.77, "rew_std": 11.3847, "Agent": "REINFORCE"}, {"env_step": 4577280, "rew": 989.89, "rew_std": 26.3412, "Agent": "REINFORCE"}, {"env_step": 4608000, "rew": 970.11, "rew_std": 56.3644, "Agent": "REINFORCE"}, {"env_step": 4638720, "rew": 976.69, "rew_std": 59.2732, "Agent": "REINFORCE"}, {"env_step": 4669440, "rew": 986.44, "rew_std": 40.68, "Agent": "REINFORCE"}, {"env_step": 4700160, "rew": 952.71, "rew_std": 125.6674, "Agent": "REINFORCE"}, {"env_step": 4730880, "rew": 928.08, "rew_std": 111.8978, "Agent": "REINFORCE"}, {"env_step": 4761600, "rew": 896.89, "rew_std": 206.626, "Agent": "REINFORCE"}, {"env_step": 4792320, "rew": 939.65, "rew_std": 163.6885, "Agent": "REINFORCE"}, {"env_step": 4823040, "rew": 944.47, "rew_std": 116.7956, "Agent": "REINFORCE"}, {"env_step": 4853760, "rew": 985.24, "rew_std": 34.0693, "Agent": "REINFORCE"}, {"env_step": 4884480, "rew": 941.44, "rew_std": 164.5019, "Agent": "REINFORCE"}, {"env_step": 4915200, "rew": 981.87, "rew_std": 52.8745, "Agent": "REINFORCE"}, {"env_step": 4945920, "rew": 969.33, "rew_std": 66.2071, "Agent": "REINFORCE"}, {"env_step": 4976640, "rew": 969.65, "rew_std": 82.8689, "Agent": "REINFORCE"}, {"env_step": 5007360, "rew": 923.34, "rew_std": 186.0589, "Agent": "REINFORCE"}, {"env_step": 5038080, "rew": 958.08, "rew_std": 125.76, "Agent": "REINFORCE"}, {"env_step": 5068800, "rew": 964.36, "rew_std": 64.0499, "Agent": "REINFORCE"}, {"env_step": 5099520, "rew": 944.88, "rew_std": 125.0058, "Agent": "REINFORCE"}, {"env_step": 5130240, "rew": 974.54, "rew_std": 47.3084, "Agent": "REINFORCE"}, {"env_step": 5160960, "rew": 942.66, "rew_std": 116.292, "Agent": "REINFORCE"}, {"env_step": 5191680, "rew": 972.72, "rew_std": 51.941, "Agent": "REINFORCE"}, {"env_step": 5222400, "rew": 955.78, "rew_std": 89.3096, "Agent": "REINFORCE"}, {"env_step": 5253120, "rew": 931.04, "rew_std": 137.3695, "Agent": "REINFORCE"}, {"env_step": 5283840, "rew": 978.13, "rew_std": 59.9788, "Agent": "REINFORCE"}, {"env_step": 5314560, "rew": 957.28, "rew_std": 75.6188, "Agent": "REINFORCE"}, {"env_step": 5345280, "rew": 975.95, "rew_std": 68.7852, "Agent": "REINFORCE"}, {"env_step": 5376000, "rew": 966.64, "rew_std": 96.825, "Agent": "REINFORCE"}, {"env_step": 5406720, "rew": 979.06, "rew_std": 62.82, "Agent": "REINFORCE"}, {"env_step": 5437440, "rew": 968.61, "rew_std": 86.5537, "Agent": "REINFORCE"}, {"env_step": 5468160, "rew": 976.44, "rew_std": 70.68, "Agent": "REINFORCE"}, {"env_step": 5498880, "rew": 958.38, "rew_std": 121.4329, "Agent": "REINFORCE"}, {"env_step": 5529600, "rew": 955.82, "rew_std": 88.6493, "Agent": "REINFORCE"}, {"env_step": 5560320, "rew": 946.08, "rew_std": 112.7584, "Agent": "REINFORCE"}, {"env_step": 5591040, "rew": 961.89, "rew_std": 60.2556, "Agent": "REINFORCE"}, {"env_step": 5621760, "rew": 940.04, "rew_std": 120.9129, "Agent": "REINFORCE"}, {"env_step": 5652480, "rew": 899.66, "rew_std": 236.9832, "Agent": "REINFORCE"}, {"env_step": 5683200, "rew": 931.92, "rew_std": 116.4014, "Agent": "REINFORCE"}, {"env_step": 5713920, "rew": 945.26, "rew_std": 146.3737, "Agent": "REINFORCE"}, {"env_step": 5744640, "rew": 948.53, "rew_std": 139.2984, "Agent": "REINFORCE"}, {"env_step": 5775360, "rew": 935.82, "rew_std": 163.0163, "Agent": "REINFORCE"}, {"env_step": 5806080, "rew": 941.58, "rew_std": 133.742, "Agent": "REINFORCE"}, {"env_step": 5836800, "rew": 946.76, "rew_std": 106.4974, "Agent": "REINFORCE"}, {"env_step": 5867520, "rew": 962.57, "rew_std": 79.0669, "Agent": "REINFORCE"}, {"env_step": 5898240, "rew": 981.65, "rew_std": 55.05, "Agent": "REINFORCE"}, {"env_step": 5928960, "rew": 972.05, "rew_std": 66.1885, "Agent": "REINFORCE"}, {"env_step": 5959680, "rew": 984.14, "rew_std": 47.58, "Agent": "REINFORCE"}, {"env_step": 5990400, "rew": 967.55, "rew_std": 88.655, "Agent": "REINFORCE"}, {"env_step": 6021120, "rew": 971.08, "rew_std": 86.76, "Agent": "REINFORCE"}, {"env_step": 6051840, "rew": 968.22, "rew_std": 95.34, "Agent": "REINFORCE"}, {"env_step": 6082560, "rew": 977.34, "rew_std": 67.98, "Agent": "REINFORCE"}, {"env_step": 6113280, "rew": 960.5, "rew_std": 118.5, "Agent": "REINFORCE"}, {"env_step": 6144000, "rew": 973.86, "rew_std": 78.42, "Agent": "REINFORCE"}, {"env_step": 6174720, "rew": 969.46, "rew_std": 58.3955, "Agent": "REINFORCE"}, {"env_step": 6205440, "rew": 979.65, "rew_std": 41.8987, "Agent": "REINFORCE"}, {"env_step": 6236160, "rew": 965.02, "rew_std": 99.5217, "Agent": "REINFORCE"}, {"env_step": 6266880, "rew": 971.33, "rew_std": 47.5716, "Agent": "REINFORCE"}, {"env_step": 6297600, "rew": 974.53, "rew_std": 38.7326, "Agent": "REINFORCE"}, {"env_step": 6328320, "rew": 977.68, "rew_std": 49.2839, "Agent": "REINFORCE"}, {"env_step": 6359040, "rew": 943.14, "rew_std": 137.6136, "Agent": "REINFORCE"}, {"env_step": 6389760, "rew": 929.24, "rew_std": 140.7475, "Agent": "REINFORCE"}, {"env_step": 6420480, "rew": 945.01, "rew_std": 125.1647, "Agent": "REINFORCE"}, {"env_step": 6451200, "rew": 985.98, "rew_std": 29.0759, "Agent": "REINFORCE"}, {"env_step": 6481920, "rew": 973.27, "rew_std": 54.1206, "Agent": "REINFORCE"}, {"env_step": 6512640, "rew": 993.2, "rew_std": 20.4, "Agent": "REINFORCE"}, {"env_step": 6543360, "rew": 995.22, "rew_std": 14.34, "Agent": "REINFORCE"}, {"env_step": 6574080, "rew": 983.8, "rew_std": 48.6, "Agent": "REINFORCE"}, {"env_step": 6604800, "rew": 977.69, "rew_std": 66.93, "Agent": "REINFORCE"}, {"env_step": 6635520, "rew": 970.33, "rew_std": 89.01, "Agent": "REINFORCE"}, {"env_step": 6666240, "rew": 928.35, "rew_std": 143.5004, "Agent": "REINFORCE"}, {"env_step": 6696960, "rew": 887.07, "rew_std": 264.9795, "Agent": "REINFORCE"}, {"env_step": 6727680, "rew": 912.96, "rew_std": 165.7926, "Agent": "REINFORCE"}, {"env_step": 6758400, "rew": 944.63, "rew_std": 112.7822, "Agent": "REINFORCE"}, {"env_step": 6789120, "rew": 972.56, "rew_std": 59.3623, "Agent": "REINFORCE"}, {"env_step": 6819840, "rew": 951.99, "rew_std": 100.6198, "Agent": "REINFORCE"}, {"env_step": 6850560, "rew": 970.37, "rew_std": 88.89, "Agent": "REINFORCE"}, {"env_step": 6881280, "rew": 959.42, "rew_std": 102.4488, "Agent": "REINFORCE"}, {"env_step": 6912000, "rew": 976.17, "rew_std": 71.49, "Agent": "REINFORCE"}, {"env_step": 6942720, "rew": 986.69, "rew_std": 29.621, "Agent": "REINFORCE"}, {"env_step": 6973440, "rew": 967.66, "rew_std": 75.8986, "Agent": "REINFORCE"}, {"env_step": 7004160, "rew": 974.04, "rew_std": 71.0949, "Agent": "REINFORCE"}, {"env_step": 7034880, "rew": 971.19, "rew_std": 63.3525, "Agent": "REINFORCE"}, {"env_step": 7065600, "rew": 964.4, "rew_std": 70.0223, "Agent": "REINFORCE"}, {"env_step": 7096320, "rew": 975.77, "rew_std": 42.3078, "Agent": "REINFORCE"}, {"env_step": 7127040, "rew": 953.71, "rew_std": 107.6088, "Agent": "REINFORCE"}, {"env_step": 7157760, "rew": 946.54, "rew_std": 160.38, "Agent": "REINFORCE"}, {"env_step": 7188480, "rew": 945.85, "rew_std": 156.6389, "Agent": "REINFORCE"}, {"env_step": 7219200, "rew": 986.76, "rew_std": 28.1261, "Agent": "REINFORCE"}, {"env_step": 7249920, "rew": 969.07, "rew_std": 79.0497, "Agent": "REINFORCE"}, {"env_step": 7280640, "rew": 964.18, "rew_std": 71.6487, "Agent": "REINFORCE"}, {"env_step": 7311360, "rew": 973.94, "rew_std": 66.5413, "Agent": "REINFORCE"}, {"env_step": 7342080, "rew": 967.18, "rew_std": 64.9514, "Agent": "REINFORCE"}, {"env_step": 7372800, "rew": 987.3, "rew_std": 38.1, "Agent": "REINFORCE"}, {"env_step": 7403520, "rew": 987.18, "rew_std": 26.4402, "Agent": "REINFORCE"}, {"env_step": 7434240, "rew": 988.15, "rew_std": 27.092, "Agent": "REINFORCE"}, {"env_step": 7464960, "rew": 997.34, "rew_std": 7.98, "Agent": "REINFORCE"}, {"env_step": 7495680, "rew": 989.45, "rew_std": 22.1128, "Agent": "REINFORCE"}, {"env_step": 7526400, "rew": 976.87, "rew_std": 32.5971, "Agent": "REINFORCE"}, {"env_step": 7557120, "rew": 990.95, "rew_std": 19.0453, "Agent": "REINFORCE"}, {"env_step": 7587840, "rew": 985.18, "rew_std": 44.46, "Agent": "REINFORCE"}, {"env_step": 7618560, "rew": 986.04, "rew_std": 27.1982, "Agent": "REINFORCE"}, {"env_step": 7649280, "rew": 996.89, "rew_std": 9.33, "Agent": "REINFORCE"}, {"env_step": 7680000, "rew": 995.35, "rew_std": 13.95, "Agent": "REINFORCE"}, {"env_step": 7710720, "rew": 993.68, "rew_std": 13.2519, "Agent": "REINFORCE"}, {"env_step": 7741440, "rew": 995.56, "rew_std": 13.32, "Agent": "REINFORCE"}, {"env_step": 7772160, "rew": 994.58, "rew_std": 16.26, "Agent": "REINFORCE"}, {"env_step": 7802880, "rew": 988.5, "rew_std": 19.8029, "Agent": "REINFORCE"}, {"env_step": 7833600, "rew": 983.51, "rew_std": 29.6331, "Agent": "REINFORCE"}, {"env_step": 7864320, "rew": 986.0, "rew_std": 35.8798, "Agent": "REINFORCE"}, {"env_step": 7895040, "rew": 999.01, "rew_std": 2.5046, "Agent": "REINFORCE"}, {"env_step": 7925760, "rew": 991.12, "rew_std": 19.6687, "Agent": "REINFORCE"}, {"env_step": 7956480, "rew": 995.02, "rew_std": 7.7363, "Agent": "REINFORCE"}, {"env_step": 7987200, "rew": 987.84, "rew_std": 16.5385, "Agent": "REINFORCE"}, {"env_step": 8017920, "rew": 998.27, "rew_std": 3.4658, "Agent": "REINFORCE"}, {"env_step": 8048640, "rew": 994.55, "rew_std": 11.6745, "Agent": "REINFORCE"}, {"env_step": 8079360, "rew": 997.05, "rew_std": 8.85, "Agent": "REINFORCE"}, {"env_step": 8110080, "rew": 996.69, "rew_std": 9.93, "Agent": "REINFORCE"}, {"env_step": 8140800, "rew": 988.87, "rew_std": 26.236, "Agent": "REINFORCE"}, {"env_step": 8171520, "rew": 998.81, "rew_std": 3.57, "Agent": "REINFORCE"}, {"env_step": 8202240, "rew": 987.15, "rew_std": 33.6569, "Agent": "REINFORCE"}, {"env_step": 8232960, "rew": 982.36, "rew_std": 27.6911, "Agent": "REINFORCE"}, {"env_step": 8263680, "rew": 989.91, "rew_std": 18.1475, "Agent": "REINFORCE"}, {"env_step": 8294400, "rew": 992.33, "rew_std": 15.7267, "Agent": "REINFORCE"}, {"env_step": 8325120, "rew": 984.41, "rew_std": 26.5234, "Agent": "REINFORCE"}, {"env_step": 8355840, "rew": 989.7, "rew_std": 26.1073, "Agent": "REINFORCE"}, {"env_step": 8386560, "rew": 994.3, "rew_std": 15.6883, "Agent": "REINFORCE"}, {"env_step": 8417280, "rew": 993.42, "rew_std": 15.0441, "Agent": "REINFORCE"}, {"env_step": 8448000, "rew": 995.75, "rew_std": 12.75, "Agent": "REINFORCE"}, {"env_step": 8478720, "rew": 987.79, "rew_std": 36.63, "Agent": "REINFORCE"}, {"env_step": 8509440, "rew": 990.6, "rew_std": 28.2, "Agent": "REINFORCE"}, {"env_step": 8540160, "rew": 987.92, "rew_std": 24.16, "Agent": "REINFORCE"}, {"env_step": 8570880, "rew": 993.01, "rew_std": 20.97, "Agent": "REINFORCE"}, {"env_step": 8601600, "rew": 991.45, "rew_std": 25.65, "Agent": "REINFORCE"}, {"env_step": 8632320, "rew": 988.16, "rew_std": 24.1036, "Agent": "REINFORCE"}, {"env_step": 8663040, "rew": 989.99, "rew_std": 27.2537, "Agent": "REINFORCE"}, {"env_step": 8693760, "rew": 980.57, "rew_std": 52.776, "Agent": "REINFORCE"}, {"env_step": 8724480, "rew": 979.38, "rew_std": 58.5658, "Agent": "REINFORCE"}, {"env_step": 8755200, "rew": 981.04, "rew_std": 45.9426, "Agent": "REINFORCE"}, {"env_step": 8785920, "rew": 988.11, "rew_std": 29.5302, "Agent": "REINFORCE"}, {"env_step": 8816640, "rew": 987.7, "rew_std": 24.7459, "Agent": "REINFORCE"}, {"env_step": 8847360, "rew": 979.86, "rew_std": 60.42, "Agent": "REINFORCE"}, {"env_step": 8878080, "rew": 977.88, "rew_std": 64.8739, "Agent": "REINFORCE"}, {"env_step": 8908800, "rew": 959.86, "rew_std": 108.7084, "Agent": "REINFORCE"}, {"env_step": 8939520, "rew": 970.0, "rew_std": 68.9139, "Agent": "REINFORCE"}, {"env_step": 8970240, "rew": 964.68, "rew_std": 74.6974, "Agent": "REINFORCE"}, {"env_step": 9000960, "rew": 990.37, "rew_std": 28.89, "Agent": "REINFORCE"}, {"env_step": 9031680, "rew": 979.94, "rew_std": 50.1546, "Agent": "REINFORCE"}, {"env_step": 9062400, "rew": 982.1, "rew_std": 52.7733, "Agent": "REINFORCE"}, {"env_step": 9093120, "rew": 986.99, "rew_std": 39.03, "Agent": "REINFORCE"}, {"env_step": 9123840, "rew": 989.79, "rew_std": 21.3974, "Agent": "REINFORCE"}, {"env_step": 9154560, "rew": 981.83, "rew_std": 52.1542, "Agent": "REINFORCE"}, {"env_step": 9185280, "rew": 982.49, "rew_std": 49.1926, "Agent": "REINFORCE"}, {"env_step": 9216000, "rew": 988.71, "rew_std": 33.87, "Agent": "REINFORCE"}, {"env_step": 9246720, "rew": 979.35, "rew_std": 34.6324, "Agent": "REINFORCE"}, {"env_step": 9277440, "rew": 974.84, "rew_std": 68.521, "Agent": "REINFORCE"}, {"env_step": 9308160, "rew": 985.45, "rew_std": 29.2879, "Agent": "REINFORCE"}, {"env_step": 9338880, "rew": 981.71, "rew_std": 40.8931, "Agent": "REINFORCE"}, {"env_step": 9369600, "rew": 982.45, "rew_std": 44.3861, "Agent": "REINFORCE"}, {"env_step": 9400320, "rew": 975.6, "rew_std": 50.5635, "Agent": "REINFORCE"}, {"env_step": 9431040, "rew": 954.35, "rew_std": 51.0388, "Agent": "REINFORCE"}, {"env_step": 9461760, "rew": 982.39, "rew_std": 40.8217, "Agent": "REINFORCE"}, {"env_step": 9492480, "rew": 977.28, "rew_std": 35.9271, "Agent": "REINFORCE"}, {"env_step": 9523200, "rew": 984.04, "rew_std": 32.9361, "Agent": "REINFORCE"}, {"env_step": 9553920, "rew": 997.36, "rew_std": 6.4032, "Agent": "REINFORCE"}, {"env_step": 9584640, "rew": 996.45, "rew_std": 10.65, "Agent": "REINFORCE"}, {"env_step": 9615360, "rew": 998.23, "rew_std": 3.6458, "Agent": "REINFORCE"}, {"env_step": 9646080, "rew": 998.04, "rew_std": 5.88, "Agent": "REINFORCE"}, {"env_step": 9676800, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 9707520, "rew": 997.27, "rew_std": 8.19, "Agent": "REINFORCE"}, {"env_step": 9738240, "rew": 997.57, "rew_std": 4.8625, "Agent": "REINFORCE"}, {"env_step": 9768960, "rew": 998.22, "rew_std": 4.8606, "Agent": "REINFORCE"}, {"env_step": 9799680, "rew": 998.18, "rew_std": 5.46, "Agent": "REINFORCE"}, {"env_step": 9830400, "rew": 991.26, "rew_std": 25.9214, "Agent": "REINFORCE"}, {"env_step": 9861120, "rew": 995.78, "rew_std": 12.66, "Agent": "REINFORCE"}, {"env_step": 9891840, "rew": 993.67, "rew_std": 16.3826, "Agent": "REINFORCE"}, {"env_step": 9922560, "rew": 985.09, "rew_std": 30.4634, "Agent": "REINFORCE"}, {"env_step": 9953280, "rew": 993.93, "rew_std": 11.1788, "Agent": "REINFORCE"}, {"env_step": 9984000, "rew": 987.52, "rew_std": 28.9694, "Agent": "REINFORCE"}, {"env_step": 10014720, "rew": 993.16, "rew_std": 15.6074, "Agent": "REINFORCE"}, {"env_step": 10045440, "rew": 991.35, "rew_std": 17.309, "Agent": "REINFORCE"}, {"env_step": 10076160, "rew": 999.52, "rew_std": 1.2246, "Agent": "REINFORCE"}, {"env_step": 10106880, "rew": 1000.0, "rew_std": 0.0, "Agent": "REINFORCE"}, {"env_step": 10137600, "rew": 990.79, "rew_std": 21.6526, "Agent": "REINFORCE"}, {"env_step": 10168320, "rew": 998.24, "rew_std": 5.28, "Agent": "REINFORCE"}, {"env_step": 10199040, "rew": 982.93, "rew_std": 32.6478, "Agent": "REINFORCE"}, {"env_step": 10229760, "rew": 991.54, "rew_std": 17.0852, "Agent": "REINFORCE"}, {"env_step": 0, "rew": 10.32, "rew_std": 2.1711, "Agent": "SAC"}, {"env_step": 5000, "rew": 97.9, "rew_std": 54.3586, "Agent": "SAC"}, {"env_step": 10000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 15000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 20000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 25000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 30000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 35000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 40000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 45000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 50000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 55000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 60000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 65000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 70000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 75000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 80000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 85000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 90000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 95000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 100000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 105000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 110000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 115000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 120000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 125000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 130000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 135000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 140000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 145000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 150000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 155000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 160000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 165000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 170000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 175000, "rew": 920.69, "rew_std": 237.93, "Agent": "SAC"}, {"env_step": 180000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 185000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 190000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 195000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 200000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 205000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 210000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 215000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 220000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 225000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 230000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 235000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 240000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 245000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 250000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 255000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 260000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 265000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 270000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 275000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 280000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 285000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 290000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 295000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 300000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 305000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 310000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 315000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 320000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 325000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 330000, "rew": 994.56, "rew_std": 16.32, "Agent": "SAC"}, {"env_step": 335000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 340000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 345000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 350000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 355000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 360000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 365000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 370000, "rew": 988.24, "rew_std": 35.28, "Agent": "SAC"}, {"env_step": 375000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 380000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 385000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 390000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 395000, "rew": 912.58, "rew_std": 262.26, "Agent": "SAC"}, {"env_step": 400000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 405000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 410000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 415000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 420000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 425000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 430000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 435000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 440000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 445000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 450000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 455000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 460000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 465000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 470000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 475000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 480000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 485000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 490000, "rew": 924.73, "rew_std": 225.81, "Agent": "SAC"}, {"env_step": 495000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 500000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 505000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 510000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 515000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 520000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 525000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 530000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 535000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 540000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 545000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 550000, "rew": 942.67, "rew_std": 171.99, "Agent": "SAC"}, {"env_step": 555000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 560000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 565000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 570000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 575000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 580000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 585000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 590000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 595000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 600000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 605000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 610000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 615000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 620000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 625000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 630000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 635000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 640000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 645000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 650000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 655000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 660000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 665000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 670000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 675000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 680000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 685000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 690000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 695000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 700000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 705000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 710000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 715000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 720000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 725000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 730000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 735000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 740000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 745000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 750000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 755000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 760000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 765000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 770000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 775000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 780000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 785000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 790000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 795000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 800000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 805000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 810000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 815000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 820000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 825000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 830000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 835000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 840000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 845000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 850000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 855000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 860000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 865000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 870000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 875000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 880000, "rew": 957.33, "rew_std": 128.01, "Agent": "SAC"}, {"env_step": 885000, "rew": 907.27, "rew_std": 278.19, "Agent": "SAC"}, {"env_step": 890000, "rew": 944.61, "rew_std": 166.17, "Agent": "SAC"}, {"env_step": 895000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 900000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 905000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 910000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 915000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 920000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 925000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 930000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 935000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 940000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 945000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 950000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 955000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 960000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 965000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 970000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 975000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 980000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 985000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 990000, "rew": 971.67, "rew_std": 84.99, "Agent": "SAC"}, {"env_step": 995000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1000000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1005000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1010000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1015000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1020000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1025000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1030000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1035000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1040000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1045000, "rew": 907.31, "rew_std": 278.07, "Agent": "SAC"}, {"env_step": 1050000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1055000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1060000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1065000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1070000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1075000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1080000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1085000, "rew": 909.78, "rew_std": 270.66, "Agent": "SAC"}, {"env_step": 1090000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1095000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1100000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1105000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1110000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1115000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1120000, "rew": 912.78, "rew_std": 261.66, "Agent": "SAC"}, {"env_step": 1125000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1130000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1135000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1140000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1145000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1150000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1155000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1160000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1165000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1170000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1175000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1180000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1185000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1190000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1195000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1200000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1205000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1210000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1215000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1220000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1225000, "rew": 906.82, "rew_std": 279.54, "Agent": "SAC"}, {"env_step": 1230000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1235000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1240000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1245000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 1250000, "rew": 1000.0, "rew_std": 0.0, "Agent": "SAC"}, {"env_step": 0, "rew": 5.85, "rew_std": 1.136, "Agent": "TRPO"}, {"env_step": 30720, "rew": 1000.0, "rew_std": 0.0, "Agent": "TRPO"}, {"env_step": 61440, "rew": 1000.0, "rew_std": 0.0, "Agent": "TRPO"}, {"env_step": 92160, "rew": 989.51, "rew_std": 31.47, "Agent": "TRPO"}, {"env_step": 122880, "rew": 930.28, "rew_std": 209.16, "Agent": "TRPO"}, {"env_step": 153600, "rew": 1000.0, "rew_std": 0.0, "Agent": "TRPO"}, {"env_step": 184320, "rew": 1000.0, "rew_std": 0.0, "Agent": "TRPO"}, {"env_step": 215040, "rew": 1000.0, "rew_std": 0.0, "Agent": "TRPO"}, {"env_step": 245760, "rew": 900.3, "rew_std": 299.1, "Agent": "TRPO"}, {"env_step": 276480, "rew": 890.4, "rew_std": 297.269, "Agent": "TRPO"}, {"env_step": 307200, "rew": 797.21, "rew_std": 365.5592, "Agent": "TRPO"}, {"env_step": 337920, "rew": 774.04, "rew_std": 355.6657, "Agent": "TRPO"}, {"env_step": 368640, "rew": 758.81, "rew_std": 362.0865, "Agent": "TRPO"}, {"env_step": 399360, "rew": 739.53, "rew_std": 357.5581, "Agent": "TRPO"}, {"env_step": 430080, "rew": 740.46, "rew_std": 357.6159, "Agent": "TRPO"}, {"env_step": 460800, "rew": 810.95, "rew_std": 342.7054, "Agent": "TRPO"}, {"env_step": 491520, "rew": 763.75, "rew_std": 334.1058, "Agent": "TRPO"}, {"env_step": 522240, "rew": 695.41, "rew_std": 379.0516, "Agent": "TRPO"}, {"env_step": 552960, "rew": 684.67, "rew_std": 347.9525, "Agent": "TRPO"}, {"env_step": 583680, "rew": 798.47, "rew_std": 337.92, "Agent": "TRPO"}, {"env_step": 614400, "rew": 771.49, "rew_std": 360.9133, "Agent": "TRPO"}, {"env_step": 645120, "rew": 782.75, "rew_std": 348.4232, "Agent": "TRPO"}, {"env_step": 675840, "rew": 784.22, "rew_std": 346.8093, "Agent": "TRPO"}, {"env_step": 706560, "rew": 842.97, "rew_std": 328.1039, "Agent": "TRPO"}, {"env_step": 737280, "rew": 738.91, "rew_std": 344.5304, "Agent": "TRPO"}, {"env_step": 768000, "rew": 796.9, "rew_std": 315.0585, "Agent": "TRPO"}, {"env_step": 798720, "rew": 765.6, "rew_std": 347.7668, "Agent": "TRPO"}, {"env_step": 829440, "rew": 837.42, "rew_std": 319.9491, "Agent": "TRPO"}, {"env_step": 860160, "rew": 727.63, "rew_std": 367.1286, "Agent": "TRPO"}, {"env_step": 890880, "rew": 709.16, "rew_std": 385.3439, "Agent": "TRPO"}, {"env_step": 921600, "rew": 719.38, "rew_std": 381.2329, "Agent": "TRPO"}, {"env_step": 952320, "rew": 757.07, "rew_std": 368.2591, "Agent": "TRPO"}, {"env_step": 983040, "rew": 757.31, "rew_std": 368.0868, "Agent": "TRPO"}, {"env_step": 1013760, "rew": 849.57, "rew_std": 320.1672, "Agent": "TRPO"}, {"env_step": 1044480, "rew": 849.46, "rew_std": 320.29, "Agent": "TRPO"}, {"env_step": 1075200, "rew": 831.09, "rew_std": 315.6989, "Agent": "TRPO"}, {"env_step": 1105920, "rew": 840.4, "rew_std": 316.5183, "Agent": "TRPO"}, {"env_step": 1136640, "rew": 850.88, "rew_std": 318.7279, "Agent": "TRPO"}, {"env_step": 1167360, "rew": 850.19, "rew_std": 319.4808, "Agent": "TRPO"}, {"env_step": 1198080, "rew": 849.49, "rew_std": 320.2565, "Agent": "TRPO"}, {"env_step": 1228800, "rew": 847.75, "rew_std": 322.2357, "Agent": "TRPO"}, {"env_step": 1259520, "rew": 900.3, "rew_std": 299.1, "Agent": "TRPO"}, {"env_step": 1290240, "rew": 891.9, "rew_std": 297.3565, "Agent": "TRPO"}, {"env_step": 1320960, "rew": 900.3, "rew_std": 299.1, "Agent": "TRPO"}, {"env_step": 1351680, "rew": 878.07, "rew_std": 299.1249, "Agent": "TRPO"}, {"env_step": 1382400, "rew": 890.46, "rew_std": 297.2712, "Agent": "TRPO"}, {"env_step": 1413120, "rew": 880.74, "rew_std": 295.1124, "Agent": "TRPO"}, {"env_step": 1443840, "rew": 872.86, "rew_std": 295.9501, "Agent": "TRPO"}, {"env_step": 1474560, "rew": 859.85, "rew_std": 298.6305, "Agent": "TRPO"}, {"env_step": 1505280, "rew": 900.3, "rew_std": 299.1, "Agent": "TRPO"}, {"env_step": 1536000, "rew": 820.37, "rew_std": 308.4939, "Agent": "TRPO"}, {"env_step": 1566720, "rew": 807.55, "rew_std": 321.8834, "Agent": "TRPO"}, {"env_step": 1597440, "rew": 860.67, "rew_std": 293.4769, "Agent": "TRPO"}, {"env_step": 1628160, "rew": 884.96, "rew_std": 297.2065, "Agent": "TRPO"}, {"env_step": 1658880, "rew": 900.3, "rew_std": 299.1, "Agent": "TRPO"}, {"env_step": 1689600, "rew": 890.74, "rew_std": 297.2828, "Agent": "TRPO"}, {"env_step": 1720320, "rew": 825.01, "rew_std": 303.3167, "Agent": "TRPO"}, {"env_step": 1751040, "rew": 826.36, "rew_std": 314.9794, "Agent": "TRPO"}, {"env_step": 1781760, "rew": 844.24, "rew_std": 305.965, "Agent": "TRPO"}, {"env_step": 1812480, "rew": 846.04, "rew_std": 303.5831, "Agent": "TRPO"}, {"env_step": 1843200, "rew": 852.38, "rew_std": 301.714, "Agent": "TRPO"}, {"env_step": 1873920, "rew": 874.05, "rew_std": 295.5331, "Agent": "TRPO"}, {"env_step": 1904640, "rew": 894.66, "rew_std": 297.6953, "Agent": "TRPO"}, {"env_step": 1935360, "rew": 870.22, "rew_std": 294.9349, "Agent": "TRPO"}, {"env_step": 1966080, "rew": 811.99, "rew_std": 357.9505, "Agent": "TRPO"}, {"env_step": 1996800, "rew": 772.68, "rew_std": 389.2261, "Agent": "TRPO"}, {"env_step": 2027520, "rew": 775.23, "rew_std": 390.2144, "Agent": "TRPO"}, {"env_step": 2058240, "rew": 779.09, "rew_std": 390.0167, "Agent": "TRPO"}, {"env_step": 2088960, "rew": 779.66, "rew_std": 391.6124, "Agent": "TRPO"}, {"env_step": 2119680, "rew": 800.73, "rew_std": 398.54, "Agent": "TRPO"}, {"env_step": 2150400, "rew": 791.31, "rew_std": 394.9517, "Agent": "TRPO"}, {"env_step": 2181120, "rew": 800.65, "rew_std": 398.7, "Agent": "TRPO"}, {"env_step": 2211840, "rew": 800.66, "rew_std": 398.68, "Agent": "TRPO"}, {"env_step": 2242560, "rew": 794.25, "rew_std": 395.7409, "Agent": "TRPO"}, {"env_step": 2273280, "rew": 795.42, "rew_std": 396.3155, "Agent": "TRPO"}, {"env_step": 2304000, "rew": 794.41, "rew_std": 395.9396, "Agent": "TRPO"}, {"env_step": 2334720, "rew": 800.71, "rew_std": 398.58, "Agent": "TRPO"}, {"env_step": 2365440, "rew": 800.71, "rew_std": 398.58, "Agent": "TRPO"}, {"env_step": 2396160, "rew": 800.72, "rew_std": 398.56, "Agent": "TRPO"}, {"env_step": 2426880, "rew": 800.8, "rew_std": 398.4, "Agent": "TRPO"}, {"env_step": 2457600, "rew": 800.75, "rew_std": 398.5, "Agent": "TRPO"}, {"env_step": 2488320, "rew": 800.74, "rew_std": 398.52, "Agent": "TRPO"}, {"env_step": 2519040, "rew": 800.75, "rew_std": 398.5, "Agent": "TRPO"}, {"env_step": 2549760, "rew": 800.71, "rew_std": 398.5801, "Agent": "TRPO"}, {"env_step": 2580480, "rew": 800.82, "rew_std": 398.36, "Agent": "TRPO"}, {"env_step": 2611200, "rew": 800.75, "rew_std": 398.5, "Agent": "TRPO"}, {"env_step": 2641920, "rew": 800.79, "rew_std": 398.42, "Agent": "TRPO"}, {"env_step": 2672640, "rew": 800.81, "rew_std": 398.38, "Agent": "TRPO"}, {"env_step": 2703360, "rew": 800.78, "rew_std": 398.44, "Agent": "TRPO"}, {"env_step": 2734080, "rew": 800.8, "rew_std": 398.4, "Agent": "TRPO"}, {"env_step": 2764800, "rew": 800.88, "rew_std": 398.2402, "Agent": "TRPO"}, {"env_step": 2795520, "rew": 801.09, "rew_std": 397.8209, "Agent": "TRPO"}, {"env_step": 2826240, "rew": 801.48, "rew_std": 397.0411, "Agent": "TRPO"}, {"env_step": 2856960, "rew": 798.93, "rew_std": 396.2046, "Agent": "TRPO"}, {"env_step": 2887680, "rew": 801.56, "rew_std": 396.8826, "Agent": "TRPO"}, {"env_step": 2918400, "rew": 801.43, "rew_std": 397.1423, "Agent": "TRPO"}, {"env_step": 2949120, "rew": 801.23, "rew_std": 397.5418, "Agent": "TRPO"}, {"env_step": 2979840, "rew": 801.53, "rew_std": 396.9428, "Agent": "TRPO"}, {"env_step": 3010560, "rew": 801.61, "rew_std": 396.7822, "Agent": "TRPO"}, {"env_step": 3041280, "rew": 801.51, "rew_std": 396.983, "Agent": "TRPO"}, {"env_step": 3072000, "rew": 801.55, "rew_std": 396.9027, "Agent": "TRPO"}, {"env_step": 0, "rew": 5.85, "rew_std": 1.136, "Agent": "A2C"}, {"env_step": 30000, "rew": 88.42, "rew_std": 63.9144, "Agent": "A2C"}, {"env_step": 60000, "rew": 806.95, "rew_std": 282.5109, "Agent": "A2C"}, {"env_step": 90000, "rew": 938.33, "rew_std": 110.1344, "Agent": "A2C"}, {"env_step": 120000, "rew": 997.57, "rew_std": 7.29, "Agent": "A2C"}, {"env_step": 150000, "rew": 958.72, "rew_std": 123.84, "Agent": "A2C"}, {"env_step": 180000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 210000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 240000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 270000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 300000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 330000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 360000, "rew": 985.62, "rew_std": 43.14, "Agent": "A2C"}, {"env_step": 390000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 420000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 450000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 480000, "rew": 908.1, "rew_std": 275.7, "Agent": "A2C"}, {"env_step": 510000, "rew": 950.15, "rew_std": 149.55, "Agent": "A2C"}, {"env_step": 540000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 570000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 600000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 630000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 660000, "rew": 987.44, "rew_std": 37.68, "Agent": "A2C"}, {"env_step": 690000, "rew": 985.83, "rew_std": 30.9024, "Agent": "A2C"}, {"env_step": 720000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 750000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 780000, "rew": 916.63, "rew_std": 240.8891, "Agent": "A2C"}, {"env_step": 810000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 840000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 870000, "rew": 980.07, "rew_std": 59.79, "Agent": "A2C"}, {"env_step": 900000, "rew": 990.03, "rew_std": 29.91, "Agent": "A2C"}, {"env_step": 930000, "rew": 982.98, "rew_std": 51.06, "Agent": "A2C"}, {"env_step": 960000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 990000, "rew": 997.05, "rew_std": 8.85, "Agent": "A2C"}, {"env_step": 1020000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 1050000, "rew": 990.3, "rew_std": 29.1, "Agent": "A2C"}, {"env_step": 1080000, "rew": 997.45, "rew_std": 7.65, "Agent": "A2C"}, {"env_step": 1110000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 1140000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 1170000, "rew": 998.3, "rew_std": 5.1, "Agent": "A2C"}, {"env_step": 1200000, "rew": 996.27, "rew_std": 11.19, "Agent": "A2C"}, {"env_step": 1230000, "rew": 991.3, "rew_std": 26.1, "Agent": "A2C"}, {"env_step": 1260000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 1290000, "rew": 988.05, "rew_std": 35.85, "Agent": "A2C"}, {"env_step": 1320000, "rew": 990.15, "rew_std": 29.55, "Agent": "A2C"}, {"env_step": 1350000, "rew": 966.65, "rew_std": 62.7151, "Agent": "A2C"}, {"env_step": 1380000, "rew": 990.04, "rew_std": 29.88, "Agent": "A2C"}, {"env_step": 1410000, "rew": 965.01, "rew_std": 41.3867, "Agent": "A2C"}, {"env_step": 1440000, "rew": 988.5, "rew_std": 24.6456, "Agent": "A2C"}, {"env_step": 1470000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 1500000, "rew": 961.3, "rew_std": 77.545, "Agent": "A2C"}, {"env_step": 1530000, "rew": 982.48, "rew_std": 52.56, "Agent": "A2C"}, {"env_step": 1560000, "rew": 983.44, "rew_std": 32.7019, "Agent": "A2C"}, {"env_step": 1590000, "rew": 990.04, "rew_std": 29.88, "Agent": "A2C"}, {"env_step": 1620000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 1650000, "rew": 990.52, "rew_std": 28.44, "Agent": "A2C"}, {"env_step": 1680000, "rew": 996.82, "rew_std": 9.54, "Agent": "A2C"}, {"env_step": 1710000, "rew": 990.35, "rew_std": 28.95, "Agent": "A2C"}, {"env_step": 1740000, "rew": 993.4, "rew_std": 19.8, "Agent": "A2C"}, {"env_step": 1770000, "rew": 986.9, "rew_std": 20.1303, "Agent": "A2C"}, {"env_step": 1800000, "rew": 980.74, "rew_std": 31.9232, "Agent": "A2C"}, {"env_step": 1830000, "rew": 999.68, "rew_std": 0.96, "Agent": "A2C"}, {"env_step": 1860000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 1890000, "rew": 998.68, "rew_std": 3.96, "Agent": "A2C"}, {"env_step": 1920000, "rew": 990.71, "rew_std": 17.068, "Agent": "A2C"}, {"env_step": 1950000, "rew": 976.31, "rew_std": 32.7669, "Agent": "A2C"}, {"env_step": 1980000, "rew": 985.47, "rew_std": 26.0654, "Agent": "A2C"}, {"env_step": 2010000, "rew": 990.07, "rew_std": 19.927, "Agent": "A2C"}, {"env_step": 2040000, "rew": 973.07, "rew_std": 43.6664, "Agent": "A2C"}, {"env_step": 2070000, "rew": 960.61, "rew_std": 48.4627, "Agent": "A2C"}, {"env_step": 2100000, "rew": 968.58, "rew_std": 34.9946, "Agent": "A2C"}, {"env_step": 2130000, "rew": 986.28, "rew_std": 29.8019, "Agent": "A2C"}, {"env_step": 2160000, "rew": 961.58, "rew_std": 74.5038, "Agent": "A2C"}, {"env_step": 2190000, "rew": 994.86, "rew_std": 15.42, "Agent": "A2C"}, {"env_step": 2220000, "rew": 990.98, "rew_std": 18.0409, "Agent": "A2C"}, {"env_step": 2250000, "rew": 979.94, "rew_std": 31.9933, "Agent": "A2C"}, {"env_step": 2280000, "rew": 937.58, "rew_std": 86.2823, "Agent": "A2C"}, {"env_step": 2310000, "rew": 990.43, "rew_std": 21.5514, "Agent": "A2C"}, {"env_step": 2340000, "rew": 986.97, "rew_std": 26.871, "Agent": "A2C"}, {"env_step": 2370000, "rew": 986.95, "rew_std": 28.0129, "Agent": "A2C"}, {"env_step": 2400000, "rew": 965.02, "rew_std": 59.0354, "Agent": "A2C"}, {"env_step": 2430000, "rew": 958.08, "rew_std": 44.2822, "Agent": "A2C"}, {"env_step": 2460000, "rew": 988.03, "rew_std": 22.285, "Agent": "A2C"}, {"env_step": 2490000, "rew": 965.07, "rew_std": 40.4661, "Agent": "A2C"}, {"env_step": 2520000, "rew": 971.9, "rew_std": 42.5035, "Agent": "A2C"}, {"env_step": 2550000, "rew": 973.6, "rew_std": 36.2035, "Agent": "A2C"}, {"env_step": 2580000, "rew": 982.17, "rew_std": 27.2857, "Agent": "A2C"}, {"env_step": 2610000, "rew": 997.66, "rew_std": 5.784, "Agent": "A2C"}, {"env_step": 2640000, "rew": 997.64, "rew_std": 7.08, "Agent": "A2C"}, {"env_step": 2670000, "rew": 952.95, "rew_std": 64.1054, "Agent": "A2C"}, {"env_step": 2700000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 2730000, "rew": 993.46, "rew_std": 19.62, "Agent": "A2C"}, {"env_step": 2760000, "rew": 972.1, "rew_std": 42.7232, "Agent": "A2C"}, {"env_step": 2790000, "rew": 971.05, "rew_std": 49.9594, "Agent": "A2C"}, {"env_step": 2820000, "rew": 980.16, "rew_std": 34.1031, "Agent": "A2C"}, {"env_step": 2850000, "rew": 1000.0, "rew_std": 0.0, "Agent": "A2C"}, {"env_step": 2880000, "rew": 987.71, "rew_std": 15.4241, "Agent": "A2C"}, {"env_step": 2910000, "rew": 978.08, "rew_std": 52.676, "Agent": "A2C"}, {"env_step": 2940000, "rew": 982.23, "rew_std": 29.1027, "Agent": "A2C"}, {"env_step": 2970000, "rew": 965.08, "rew_std": 58.7017, "Agent": "A2C"}, {"env_step": 3000000, "rew": 980.32, "rew_std": 28.4113, "Agent": "A2C"}, {"env_step": 0, "rew": 5.99, "rew_std": 1.2349, "Agent": "ACKTR"}, {"env_step": 30000, "rew": 313.47, "rew_std": 203.7635, "Agent": "ACKTR"}, {"env_step": 60000, "rew": 534.03, "rew_std": 289.5857, "Agent": "ACKTR"}, {"env_step": 90000, "rew": 541.5, "rew_std": 329.0577, "Agent": "ACKTR"}, {"env_step": 120000, "rew": 609.41, "rew_std": 302.4261, "Agent": "ACKTR"}, {"env_step": 150000, "rew": 646.59, "rew_std": 352.701, "Agent": "ACKTR"}, {"env_step": 180000, "rew": 858.15, "rew_std": 211.9754, "Agent": "ACKTR"}, {"env_step": 210000, "rew": 847.46, "rew_std": 134.496, "Agent": "ACKTR"}, {"env_step": 240000, "rew": 919.39, "rew_std": 122.1931, "Agent": "ACKTR"}, {"env_step": 270000, "rew": 822.09, "rew_std": 272.8888, "Agent": "ACKTR"}, {"env_step": 300000, "rew": 775.75, "rew_std": 285.1984, "Agent": "ACKTR"}, {"env_step": 330000, "rew": 796.85, "rew_std": 191.7313, "Agent": "ACKTR"}, {"env_step": 360000, "rew": 793.5, "rew_std": 232.3509, "Agent": "ACKTR"}, {"env_step": 390000, "rew": 766.23, "rew_std": 186.8284, "Agent": "ACKTR"}, {"env_step": 420000, "rew": 770.9, "rew_std": 231.9864, "Agent": "ACKTR"}, {"env_step": 450000, "rew": 557.01, "rew_std": 265.0333, "Agent": "ACKTR"}, {"env_step": 480000, "rew": 643.63, "rew_std": 198.2259, "Agent": "ACKTR"}, {"env_step": 510000, "rew": 655.74, "rew_std": 248.7802, "Agent": "ACKTR"}, {"env_step": 540000, "rew": 644.07, "rew_std": 279.2841, "Agent": "ACKTR"}, {"env_step": 570000, "rew": 607.08, "rew_std": 278.9008, "Agent": "ACKTR"}, {"env_step": 600000, "rew": 448.93, "rew_std": 192.6356, "Agent": "ACKTR"}, {"env_step": 630000, "rew": 438.66, "rew_std": 261.3708, "Agent": "ACKTR"}, {"env_step": 660000, "rew": 452.1, "rew_std": 209.2038, "Agent": "ACKTR"}, {"env_step": 690000, "rew": 401.65, "rew_std": 190.0115, "Agent": "ACKTR"}, {"env_step": 720000, "rew": 437.32, "rew_std": 194.3982, "Agent": "ACKTR"}, {"env_step": 750000, "rew": 495.24, "rew_std": 232.2461, "Agent": "ACKTR"}, {"env_step": 780000, "rew": 424.89, "rew_std": 181.4208, "Agent": "ACKTR"}, {"env_step": 810000, "rew": 395.02, "rew_std": 177.9833, "Agent": "ACKTR"}, {"env_step": 840000, "rew": 438.87, "rew_std": 197.3462, "Agent": "ACKTR"}, {"env_step": 870000, "rew": 461.06, "rew_std": 171.3335, "Agent": "ACKTR"}, {"env_step": 900000, "rew": 408.88, "rew_std": 173.7583, "Agent": "ACKTR"}, {"env_step": 930000, "rew": 388.03, "rew_std": 130.1942, "Agent": "ACKTR"}, {"env_step": 960000, "rew": 368.69, "rew_std": 126.2282, "Agent": "ACKTR"}, {"env_step": 990000, "rew": 338.07, "rew_std": 115.6302, "Agent": "ACKTR"}, {"env_step": 1020000, "rew": 479.56, "rew_std": 116.6755, "Agent": "ACKTR"}, {"env_step": 1050000, "rew": 366.69, "rew_std": 65.0125, "Agent": "ACKTR"}, {"env_step": 1080000, "rew": 346.03, "rew_std": 100.4225, "Agent": "ACKTR"}, {"env_step": 1110000, "rew": 384.12, "rew_std": 138.678, "Agent": "ACKTR"}, {"env_step": 1140000, "rew": 404.38, "rew_std": 138.7965, "Agent": "ACKTR"}, {"env_step": 1170000, "rew": 408.8, "rew_std": 80.9222, "Agent": "ACKTR"}, {"env_step": 1200000, "rew": 463.52, "rew_std": 103.9175, "Agent": "ACKTR"}, {"env_step": 1230000, "rew": 458.96, "rew_std": 142.3945, "Agent": "ACKTR"}, {"env_step": 1260000, "rew": 424.97, "rew_std": 91.784, "Agent": "ACKTR"}, {"env_step": 1290000, "rew": 476.73, "rew_std": 116.2978, "Agent": "ACKTR"}, {"env_step": 1320000, "rew": 459.55, "rew_std": 108.4361, "Agent": "ACKTR"}, {"env_step": 1350000, "rew": 456.39, "rew_std": 112.051, "Agent": "ACKTR"}, {"env_step": 1380000, "rew": 452.93, "rew_std": 104.9081, "Agent": "ACKTR"}, {"env_step": 1410000, "rew": 492.24, "rew_std": 118.6143, "Agent": "ACKTR"}, {"env_step": 1440000, "rew": 458.97, "rew_std": 153.6851, "Agent": "ACKTR"}, {"env_step": 1470000, "rew": 401.87, "rew_std": 128.9353, "Agent": "ACKTR"}, {"env_step": 1500000, "rew": 370.83, "rew_std": 120.0335, "Agent": "ACKTR"}, {"env_step": 1530000, "rew": 412.28, "rew_std": 147.2309, "Agent": "ACKTR"}, {"env_step": 1560000, "rew": 460.41, "rew_std": 130.92, "Agent": "ACKTR"}, {"env_step": 1590000, "rew": 457.59, "rew_std": 73.1311, "Agent": "ACKTR"}, {"env_step": 1620000, "rew": 467.18, "rew_std": 125.8918, "Agent": "ACKTR"}, {"env_step": 1650000, "rew": 458.3, "rew_std": 81.4617, "Agent": "ACKTR"}, {"env_step": 1680000, "rew": 484.95, "rew_std": 105.4011, "Agent": "ACKTR"}, {"env_step": 1710000, "rew": 453.66, "rew_std": 129.8921, "Agent": "ACKTR"}, {"env_step": 1740000, "rew": 491.3, "rew_std": 64.6613, "Agent": "ACKTR"}, {"env_step": 1770000, "rew": 474.39, "rew_std": 141.4254, "Agent": "ACKTR"}, {"env_step": 1800000, "rew": 431.69, "rew_std": 171.9348, "Agent": "ACKTR"}, {"env_step": 1830000, "rew": 485.4, "rew_std": 87.1934, "Agent": "ACKTR"}, {"env_step": 1860000, "rew": 428.5, "rew_std": 113.7902, "Agent": "ACKTR"}, {"env_step": 1890000, "rew": 518.56, "rew_std": 181.2914, "Agent": "ACKTR"}, {"env_step": 1920000, "rew": 441.13, "rew_std": 117.0855, "Agent": "ACKTR"}, {"env_step": 1950000, "rew": 434.05, "rew_std": 89.4931, "Agent": "ACKTR"}, {"env_step": 1980000, "rew": 450.89, "rew_std": 97.5655, "Agent": "ACKTR"}, {"env_step": 2010000, "rew": 416.78, "rew_std": 107.1259, "Agent": "ACKTR"}, {"env_step": 2040000, "rew": 385.79, "rew_std": 117.5148, "Agent": "ACKTR"}, {"env_step": 2070000, "rew": 481.94, "rew_std": 85.9594, "Agent": "ACKTR"}, {"env_step": 2100000, "rew": 443.37, "rew_std": 58.4024, "Agent": "ACKTR"}, {"env_step": 2130000, "rew": 474.56, "rew_std": 155.324, "Agent": "ACKTR"}, {"env_step": 2160000, "rew": 558.26, "rew_std": 124.035, "Agent": "ACKTR"}, {"env_step": 2190000, "rew": 442.35, "rew_std": 130.7163, "Agent": "ACKTR"}, {"env_step": 2220000, "rew": 513.09, "rew_std": 197.6661, "Agent": "ACKTR"}, {"env_step": 2250000, "rew": 450.04, "rew_std": 110.6129, "Agent": "ACKTR"}, {"env_step": 2280000, "rew": 431.79, "rew_std": 111.2214, "Agent": "ACKTR"}, {"env_step": 2310000, "rew": 465.74, "rew_std": 135.4457, "Agent": "ACKTR"}, {"env_step": 2340000, "rew": 441.41, "rew_std": 55.1811, "Agent": "ACKTR"}, {"env_step": 2370000, "rew": 448.22, "rew_std": 121.5187, "Agent": "ACKTR"}, {"env_step": 2400000, "rew": 476.63, "rew_std": 129.5021, "Agent": "ACKTR"}, {"env_step": 2430000, "rew": 452.66, "rew_std": 105.8468, "Agent": "ACKTR"}, {"env_step": 2460000, "rew": 446.97, "rew_std": 83.4278, "Agent": "ACKTR"}, {"env_step": 2490000, "rew": 429.67, "rew_std": 108.2704, "Agent": "ACKTR"}, {"env_step": 2520000, "rew": 439.24, "rew_std": 102.1129, "Agent": "ACKTR"}, {"env_step": 2550000, "rew": 432.48, "rew_std": 92.3938, "Agent": "ACKTR"}, {"env_step": 2580000, "rew": 477.79, "rew_std": 97.2943, "Agent": "ACKTR"}, {"env_step": 2610000, "rew": 493.62, "rew_std": 116.7853, "Agent": "ACKTR"}, {"env_step": 2640000, "rew": 510.83, "rew_std": 91.1766, "Agent": "ACKTR"}, {"env_step": 2670000, "rew": 525.39, "rew_std": 131.0754, "Agent": "ACKTR"}, {"env_step": 2700000, "rew": 414.55, "rew_std": 86.8364, "Agent": "ACKTR"}, {"env_step": 2730000, "rew": 504.56, "rew_std": 111.8608, "Agent": "ACKTR"}, {"env_step": 2760000, "rew": 488.42, "rew_std": 169.2835, "Agent": "ACKTR"}, {"env_step": 2790000, "rew": 454.02, "rew_std": 124.0767, "Agent": "ACKTR"}, {"env_step": 2820000, "rew": 495.83, "rew_std": 160.6988, "Agent": "ACKTR"}, {"env_step": 2850000, "rew": 382.39, "rew_std": 145.6528, "Agent": "ACKTR"}, {"env_step": 2880000, "rew": 489.15, "rew_std": 87.9129, "Agent": "ACKTR"}, {"env_step": 2910000, "rew": 492.83, "rew_std": 75.5344, "Agent": "ACKTR"}, {"env_step": 2940000, "rew": 485.68, "rew_std": 144.0268, "Agent": "ACKTR"}, {"env_step": 2970000, "rew": 498.1, "rew_std": 139.3425, "Agent": "ACKTR"}, {"env_step": 3000000, "rew": 485.74, "rew_std": 118.2865, "Agent": "ACKTR"}, {"env_step": 0, "rew": 10.32, "rew_std": 2.1711, "Agent": "DDPG"}, {"env_step": 5000, "rew": 41.15, "rew_std": 17.2288, "Agent": "DDPG"}, {"env_step": 10000, "rew": 53.78, "rew_std": 29.9129, "Agent": "DDPG"}, {"env_step": 15000, "rew": 638.39, "rew_std": 444.4626, "Agent": "DDPG"}, {"env_step": 20000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 25000, "rew": 982.36, "rew_std": 52.92, "Agent": "DDPG"}, {"env_step": 30000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 35000, "rew": 946.08, "rew_std": 141.1384, "Agent": "DDPG"}, {"env_step": 40000, "rew": 922.44, "rew_std": 232.68, "Agent": "DDPG"}, {"env_step": 45000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 50000, "rew": 990.96, "rew_std": 27.12, "Agent": "DDPG"}, {"env_step": 55000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 60000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 65000, "rew": 904.88, "rew_std": 262.7022, "Agent": "DDPG"}, {"env_step": 70000, "rew": 996.64, "rew_std": 10.08, "Agent": "DDPG"}, {"env_step": 75000, "rew": 847.65, "rew_std": 310.1592, "Agent": "DDPG"}, {"env_step": 80000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 85000, "rew": 754.62, "rew_std": 378.6501, "Agent": "DDPG"}, {"env_step": 90000, "rew": 909.22, "rew_std": 272.34, "Agent": "DDPG"}, {"env_step": 95000, "rew": 906.05, "rew_std": 281.85, "Agent": "DDPG"}, {"env_step": 100000, "rew": 907.39, "rew_std": 277.83, "Agent": "DDPG"}, {"env_step": 105000, "rew": 959.77, "rew_std": 120.69, "Agent": "DDPG"}, {"env_step": 110000, "rew": 995.98, "rew_std": 12.06, "Agent": "DDPG"}, {"env_step": 115000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 120000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 125000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 130000, "rew": 909.5, "rew_std": 271.5, "Agent": "DDPG"}, {"env_step": 135000, "rew": 909.05, "rew_std": 272.85, "Agent": "DDPG"}, {"env_step": 140000, "rew": 980.01, "rew_std": 59.97, "Agent": "DDPG"}, {"env_step": 145000, "rew": 912.67, "rew_std": 261.99, "Agent": "DDPG"}, {"env_step": 150000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 155000, "rew": 844.36, "rew_std": 321.8701, "Agent": "DDPG"}, {"env_step": 160000, "rew": 964.87, "rew_std": 105.39, "Agent": "DDPG"}, {"env_step": 165000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 170000, "rew": 817.01, "rew_std": 366.5122, "Agent": "DDPG"}, {"env_step": 175000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 180000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 185000, "rew": 908.82, "rew_std": 252.7725, "Agent": "DDPG"}, {"env_step": 190000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 195000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 200000, "rew": 904.26, "rew_std": 287.22, "Agent": "DDPG"}, {"env_step": 205000, "rew": 862.49, "rew_std": 294.1062, "Agent": "DDPG"}, {"env_step": 210000, "rew": 990.86, "rew_std": 27.42, "Agent": "DDPG"}, {"env_step": 215000, "rew": 895.51, "rew_std": 257.5641, "Agent": "DDPG"}, {"env_step": 220000, "rew": 773.93, "rew_std": 349.0457, "Agent": "DDPG"}, {"env_step": 225000, "rew": 910.11, "rew_std": 269.67, "Agent": "DDPG"}, {"env_step": 230000, "rew": 867.81, "rew_std": 292.9672, "Agent": "DDPG"}, {"env_step": 235000, "rew": 818.76, "rew_std": 325.96, "Agent": "DDPG"}, {"env_step": 240000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 245000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 250000, "rew": 968.3, "rew_std": 71.1283, "Agent": "DDPG"}, {"env_step": 255000, "rew": 812.26, "rew_std": 375.4814, "Agent": "DDPG"}, {"env_step": 260000, "rew": 990.07, "rew_std": 29.79, "Agent": "DDPG"}, {"env_step": 265000, "rew": 982.53, "rew_std": 52.41, "Agent": "DDPG"}, {"env_step": 270000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 275000, "rew": 869.48, "rew_std": 289.0383, "Agent": "DDPG"}, {"env_step": 280000, "rew": 921.04, "rew_std": 236.88, "Agent": "DDPG"}, {"env_step": 285000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 290000, "rew": 962.56, "rew_std": 112.32, "Agent": "DDPG"}, {"env_step": 295000, "rew": 686.91, "rew_std": 392.568, "Agent": "DDPG"}, {"env_step": 300000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 305000, "rew": 908.78, "rew_std": 273.66, "Agent": "DDPG"}, {"env_step": 310000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 315000, "rew": 911.93, "rew_std": 264.21, "Agent": "DDPG"}, {"env_step": 320000, "rew": 818.29, "rew_std": 341.6617, "Agent": "DDPG"}, {"env_step": 325000, "rew": 914.95, "rew_std": 229.7549, "Agent": "DDPG"}, {"env_step": 330000, "rew": 982.79, "rew_std": 51.63, "Agent": "DDPG"}, {"env_step": 335000, "rew": 906.27, "rew_std": 281.19, "Agent": "DDPG"}, {"env_step": 340000, "rew": 912.32, "rew_std": 263.04, "Agent": "DDPG"}, {"env_step": 345000, "rew": 995.31, "rew_std": 14.07, "Agent": "DDPG"}, {"env_step": 350000, "rew": 914.14, "rew_std": 257.58, "Agent": "DDPG"}, {"env_step": 355000, "rew": 912.27, "rew_std": 263.19, "Agent": "DDPG"}, {"env_step": 360000, "rew": 753.66, "rew_std": 377.72, "Agent": "DDPG"}, {"env_step": 365000, "rew": 923.03, "rew_std": 223.965, "Agent": "DDPG"}, {"env_step": 370000, "rew": 903.03, "rew_std": 290.91, "Agent": "DDPG"}, {"env_step": 375000, "rew": 828.6, "rew_std": 344.9558, "Agent": "DDPG"}, {"env_step": 380000, "rew": 909.52, "rew_std": 271.44, "Agent": "DDPG"}, {"env_step": 385000, "rew": 951.22, "rew_std": 146.34, "Agent": "DDPG"}, {"env_step": 390000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 395000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 400000, "rew": 964.94, "rew_std": 105.18, "Agent": "DDPG"}, {"env_step": 405000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 410000, "rew": 932.17, "rew_std": 203.49, "Agent": "DDPG"}, {"env_step": 415000, "rew": 981.03, "rew_std": 56.91, "Agent": "DDPG"}, {"env_step": 420000, "rew": 820.77, "rew_std": 337.9462, "Agent": "DDPG"}, {"env_step": 425000, "rew": 750.05, "rew_std": 388.838, "Agent": "DDPG"}, {"env_step": 430000, "rew": 990.12, "rew_std": 29.64, "Agent": "DDPG"}, {"env_step": 435000, "rew": 794.77, "rew_std": 353.8976, "Agent": "DDPG"}, {"env_step": 440000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 445000, "rew": 907.03, "rew_std": 278.91, "Agent": "DDPG"}, {"env_step": 450000, "rew": 980.83, "rew_std": 38.3643, "Agent": "DDPG"}, {"env_step": 455000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 460000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 465000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 470000, "rew": 864.28, "rew_std": 287.4623, "Agent": "DDPG"}, {"env_step": 475000, "rew": 998.64, "rew_std": 4.08, "Agent": "DDPG"}, {"env_step": 480000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 485000, "rew": 917.69, "rew_std": 246.93, "Agent": "DDPG"}, {"env_step": 490000, "rew": 994.05, "rew_std": 17.85, "Agent": "DDPG"}, {"env_step": 495000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 500000, "rew": 883.9, "rew_std": 193.0312, "Agent": "DDPG"}, {"env_step": 505000, "rew": 809.55, "rew_std": 381.3104, "Agent": "DDPG"}, {"env_step": 510000, "rew": 895.14, "rew_std": 234.18, "Agent": "DDPG"}, {"env_step": 515000, "rew": 919.31, "rew_std": 242.07, "Agent": "DDPG"}, {"env_step": 520000, "rew": 821.45, "rew_std": 357.8348, "Agent": "DDPG"}, {"env_step": 525000, "rew": 883.2, "rew_std": 291.5019, "Agent": "DDPG"}, {"env_step": 530000, "rew": 882.44, "rew_std": 235.4276, "Agent": "DDPG"}, {"env_step": 535000, "rew": 925.62, "rew_std": 223.14, "Agent": "DDPG"}, {"env_step": 540000, "rew": 962.11, "rew_std": 113.67, "Agent": "DDPG"}, {"env_step": 545000, "rew": 916.88, "rew_std": 249.36, "Agent": "DDPG"}, {"env_step": 550000, "rew": 968.45, "rew_std": 94.65, "Agent": "DDPG"}, {"env_step": 555000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 560000, "rew": 936.39, "rew_std": 138.9512, "Agent": "DDPG"}, {"env_step": 565000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 570000, "rew": 901.64, "rew_std": 285.901, "Agent": "DDPG"}, {"env_step": 575000, "rew": 860.19, "rew_std": 289.7419, "Agent": "DDPG"}, {"env_step": 580000, "rew": 794.28, "rew_std": 342.0737, "Agent": "DDPG"}, {"env_step": 585000, "rew": 908.6, "rew_std": 274.2, "Agent": "DDPG"}, {"env_step": 590000, "rew": 980.7, "rew_std": 57.9, "Agent": "DDPG"}, {"env_step": 595000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 600000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 605000, "rew": 944.19, "rew_std": 167.43, "Agent": "DDPG"}, {"env_step": 610000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 615000, "rew": 822.83, "rew_std": 338.3354, "Agent": "DDPG"}, {"env_step": 620000, "rew": 996.75, "rew_std": 9.75, "Agent": "DDPG"}, {"env_step": 625000, "rew": 876.11, "rew_std": 290.0732, "Agent": "DDPG"}, {"env_step": 630000, "rew": 829.63, "rew_std": 344.1681, "Agent": "DDPG"}, {"env_step": 635000, "rew": 851.7, "rew_std": 307.4943, "Agent": "DDPG"}, {"env_step": 640000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 645000, "rew": 914.73, "rew_std": 227.7837, "Agent": "DDPG"}, {"env_step": 650000, "rew": 780.85, "rew_std": 353.241, "Agent": "DDPG"}, {"env_step": 655000, "rew": 828.64, "rew_std": 346.8068, "Agent": "DDPG"}, {"env_step": 660000, "rew": 920.6, "rew_std": 238.2, "Agent": "DDPG"}, {"env_step": 665000, "rew": 695.43, "rew_std": 360.9379, "Agent": "DDPG"}, {"env_step": 670000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 675000, "rew": 889.81, "rew_std": 275.4378, "Agent": "DDPG"}, {"env_step": 680000, "rew": 921.47, "rew_std": 235.59, "Agent": "DDPG"}, {"env_step": 685000, "rew": 914.11, "rew_std": 257.67, "Agent": "DDPG"}, {"env_step": 690000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 695000, "rew": 912.09, "rew_std": 263.73, "Agent": "DDPG"}, {"env_step": 700000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 705000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 710000, "rew": 992.54, "rew_std": 22.38, "Agent": "DDPG"}, {"env_step": 715000, "rew": 908.83, "rew_std": 273.51, "Agent": "DDPG"}, {"env_step": 720000, "rew": 971.07, "rew_std": 86.79, "Agent": "DDPG"}, {"env_step": 725000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 730000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 735000, "rew": 989.89, "rew_std": 30.33, "Agent": "DDPG"}, {"env_step": 740000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 745000, "rew": 978.06, "rew_std": 44.4382, "Agent": "DDPG"}, {"env_step": 750000, "rew": 934.12, "rew_std": 197.64, "Agent": "DDPG"}, {"env_step": 755000, "rew": 918.17, "rew_std": 245.49, "Agent": "DDPG"}, {"env_step": 760000, "rew": 982.55, "rew_std": 52.35, "Agent": "DDPG"}, {"env_step": 765000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 770000, "rew": 906.26, "rew_std": 281.22, "Agent": "DDPG"}, {"env_step": 775000, "rew": 907.98, "rew_std": 276.06, "Agent": "DDPG"}, {"env_step": 780000, "rew": 849.33, "rew_std": 303.7142, "Agent": "DDPG"}, {"env_step": 785000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 790000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 795000, "rew": 963.47, "rew_std": 109.59, "Agent": "DDPG"}, {"env_step": 800000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 805000, "rew": 885.71, "rew_std": 283.8073, "Agent": "DDPG"}, {"env_step": 810000, "rew": 909.16, "rew_std": 272.52, "Agent": "DDPG"}, {"env_step": 815000, "rew": 887.46, "rew_std": 232.1516, "Agent": "DDPG"}, {"env_step": 820000, "rew": 990.9, "rew_std": 27.3, "Agent": "DDPG"}, {"env_step": 825000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 830000, "rew": 915.07, "rew_std": 254.79, "Agent": "DDPG"}, {"env_step": 835000, "rew": 992.61, "rew_std": 22.17, "Agent": "DDPG"}, {"env_step": 840000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 845000, "rew": 900.96, "rew_std": 297.12, "Agent": "DDPG"}, {"env_step": 850000, "rew": 924.3, "rew_std": 227.1, "Agent": "DDPG"}, {"env_step": 855000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 860000, "rew": 910.32, "rew_std": 269.04, "Agent": "DDPG"}, {"env_step": 865000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 870000, "rew": 972.08, "rew_std": 83.76, "Agent": "DDPG"}, {"env_step": 875000, "rew": 910.32, "rew_std": 269.04, "Agent": "DDPG"}, {"env_step": 880000, "rew": 907.29, "rew_std": 278.13, "Agent": "DDPG"}, {"env_step": 885000, "rew": 890.26, "rew_std": 269.6544, "Agent": "DDPG"}, {"env_step": 890000, "rew": 951.63, "rew_std": 120.6337, "Agent": "DDPG"}, {"env_step": 895000, "rew": 929.04, "rew_std": 212.88, "Agent": "DDPG"}, {"env_step": 900000, "rew": 925.66, "rew_std": 193.9828, "Agent": "DDPG"}, {"env_step": 905000, "rew": 914.34, "rew_std": 256.98, "Agent": "DDPG"}, {"env_step": 910000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 915000, "rew": 973.56, "rew_std": 79.32, "Agent": "DDPG"}, {"env_step": 920000, "rew": 834.16, "rew_std": 333.6571, "Agent": "DDPG"}, {"env_step": 925000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 930000, "rew": 818.05, "rew_std": 364.085, "Agent": "DDPG"}, {"env_step": 935000, "rew": 847.89, "rew_std": 308.9834, "Agent": "DDPG"}, {"env_step": 940000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 945000, "rew": 963.11, "rew_std": 110.67, "Agent": "DDPG"}, {"env_step": 950000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 955000, "rew": 905.48, "rew_std": 283.56, "Agent": "DDPG"}, {"env_step": 960000, "rew": 942.27, "rew_std": 146.4769, "Agent": "DDPG"}, {"env_step": 965000, "rew": 853.11, "rew_std": 275.556, "Agent": "DDPG"}, {"env_step": 970000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 975000, "rew": 912.17, "rew_std": 263.49, "Agent": "DDPG"}, {"env_step": 980000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 985000, "rew": 923.86, "rew_std": 228.42, "Agent": "DDPG"}, {"env_step": 990000, "rew": 854.05, "rew_std": 314.9146, "Agent": "DDPG"}, {"env_step": 995000, "rew": 736.91, "rew_std": 403.1681, "Agent": "DDPG"}, {"env_step": 1000000, "rew": 924.53, "rew_std": 226.41, "Agent": "DDPG"}, {"env_step": 1005000, "rew": 996.16, "rew_std": 11.52, "Agent": "DDPG"}, {"env_step": 1010000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1015000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1020000, "rew": 840.45, "rew_std": 257.3666, "Agent": "DDPG"}, {"env_step": 1025000, "rew": 822.64, "rew_std": 354.8743, "Agent": "DDPG"}, {"env_step": 1030000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1035000, "rew": 910.85, "rew_std": 267.45, "Agent": "DDPG"}, {"env_step": 1040000, "rew": 912.68, "rew_std": 261.96, "Agent": "DDPG"}, {"env_step": 1045000, "rew": 945.21, "rew_std": 164.37, "Agent": "DDPG"}, {"env_step": 1050000, "rew": 980.2, "rew_std": 59.4, "Agent": "DDPG"}, {"env_step": 1055000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1060000, "rew": 816.61, "rew_std": 366.8583, "Agent": "DDPG"}, {"env_step": 1065000, "rew": 908.51, "rew_std": 274.47, "Agent": "DDPG"}, {"env_step": 1070000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1075000, "rew": 907.18, "rew_std": 278.46, "Agent": "DDPG"}, {"env_step": 1080000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1085000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1090000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1095000, "rew": 980.25, "rew_std": 59.25, "Agent": "DDPG"}, {"env_step": 1100000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1105000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1110000, "rew": 910.12, "rew_std": 269.64, "Agent": "DDPG"}, {"env_step": 1115000, "rew": 766.1, "rew_std": 364.7707, "Agent": "DDPG"}, {"env_step": 1120000, "rew": 908.51, "rew_std": 264.2015, "Agent": "DDPG"}, {"env_step": 1125000, "rew": 958.67, "rew_std": 123.99, "Agent": "DDPG"}, {"env_step": 1130000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1135000, "rew": 994.92, "rew_std": 15.24, "Agent": "DDPG"}, {"env_step": 1140000, "rew": 971.41, "rew_std": 85.77, "Agent": "DDPG"}, {"env_step": 1145000, "rew": 925.66, "rew_std": 223.02, "Agent": "DDPG"}, {"env_step": 1150000, "rew": 907.61, "rew_std": 277.17, "Agent": "DDPG"}, {"env_step": 1155000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1160000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1165000, "rew": 851.25, "rew_std": 299.4327, "Agent": "DDPG"}, {"env_step": 1170000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1175000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1180000, "rew": 994.58, "rew_std": 16.26, "Agent": "DDPG"}, {"env_step": 1185000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1190000, "rew": 990.83, "rew_std": 27.51, "Agent": "DDPG"}, {"env_step": 1195000, "rew": 911.21, "rew_std": 266.37, "Agent": "DDPG"}, {"env_step": 1200000, "rew": 905.24, "rew_std": 284.28, "Agent": "DDPG"}, {"env_step": 1205000, "rew": 943.31, "rew_std": 170.07, "Agent": "DDPG"}, {"env_step": 1210000, "rew": 990.66, "rew_std": 28.02, "Agent": "DDPG"}, {"env_step": 1215000, "rew": 954.84, "rew_std": 135.48, "Agent": "DDPG"}, {"env_step": 1220000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1225000, "rew": 990.61, "rew_std": 28.17, "Agent": "DDPG"}, {"env_step": 1230000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1235000, "rew": 962.42, "rew_std": 112.74, "Agent": "DDPG"}, {"env_step": 1240000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 1245000, "rew": 802.56, "rew_std": 334.6394, "Agent": "DDPG"}, {"env_step": 1250000, "rew": 1000.0, "rew_std": 0.0, "Agent": "DDPG"}, {"env_step": 0, "rew": 5.85, "rew_std": 1.136, "Agent": "NPG"}, {"env_step": 30720, "rew": 59.57, "rew_std": 12.752, "Agent": "NPG"}, {"env_step": 61440, "rew": 963.52, "rew_std": 45.1707, "Agent": "NPG"}, {"env_step": 92160, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 122880, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 153600, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 184320, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 215040, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 245760, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 276480, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 307200, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 337920, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 368640, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 399360, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 430080, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 460800, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 491520, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 522240, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 552960, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 583680, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 614400, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 645120, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 675840, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 706560, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 737280, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 768000, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 798720, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 829440, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 860160, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 890880, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 921600, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 952320, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 983040, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1013760, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1044480, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1075200, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1105920, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1136640, "rew": 990.08, "rew_std": 29.76, "Agent": "NPG"}, {"env_step": 1167360, "rew": 970.56, "rew_std": 62.6863, "Agent": "NPG"}, {"env_step": 1198080, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1228800, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1259520, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1290240, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1320960, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1351680, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1382400, "rew": 980.4, "rew_std": 58.8, "Agent": "NPG"}, {"env_step": 1413120, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1443840, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1474560, "rew": 980.64, "rew_std": 58.08, "Agent": "NPG"}, {"env_step": 1505280, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1536000, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1566720, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1597440, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1628160, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1658880, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1689600, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1720320, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1751040, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1781760, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1812480, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1843200, "rew": 990.07, "rew_std": 29.79, "Agent": "NPG"}, {"env_step": 1873920, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1904640, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1935360, "rew": 970.19, "rew_std": 89.43, "Agent": "NPG"}, {"env_step": 1966080, "rew": 1000.0, "rew_std": 0.0, "Agent": "NPG"}, {"env_step": 1996800, "rew": 980.21, "rew_std": 59.37, "Agent": "NPG"}, {"env_step": 2027520, "rew": 980.1, "rew_std": 59.7, "Agent": "NPG"}, {"env_step": 2058240, "rew": 970.14, "rew_std": 89.58, "Agent": "NPG"}, {"env_step": 2088960, "rew": 980.11, "rew_std": 59.67, "Agent": "NPG"}, {"env_step": 2119680, "rew": 970.14, "rew_std": 89.58, "Agent": "NPG"}, {"env_step": 2150400, "rew": 940.28, "rew_std": 179.16, "Agent": "NPG"}, {"env_step": 2181120, "rew": 950.22, "rew_std": 149.34, "Agent": "NPG"}, {"env_step": 2211840, "rew": 970.16, "rew_std": 89.52, "Agent": "NPG"}, {"env_step": 2242560, "rew": 950.24, "rew_std": 149.28, "Agent": "NPG"}, {"env_step": 2273280, "rew": 940.28, "rew_std": 179.16, "Agent": "NPG"}, {"env_step": 2304000, "rew": 970.12, "rew_std": 89.64, "Agent": "NPG"}, {"env_step": 2334720, "rew": 960.2, "rew_std": 119.4, "Agent": "NPG"}, {"env_step": 2365440, "rew": 940.35, "rew_std": 178.95, "Agent": "NPG"}, {"env_step": 2396160, "rew": 980.13, "rew_std": 59.61, "Agent": "NPG"}, {"env_step": 2426880, "rew": 960.17, "rew_std": 119.49, "Agent": "NPG"}, {"env_step": 2457600, "rew": 980.15, "rew_std": 59.55, "Agent": "NPG"}, {"env_step": 2488320, "rew": 930.39, "rew_std": 208.83, "Agent": "NPG"}, {"env_step": 2519040, "rew": 960.17, "rew_std": 119.49, "Agent": "NPG"}, {"env_step": 2549760, "rew": 950.24, "rew_std": 149.28, "Agent": "NPG"}, {"env_step": 2580480, "rew": 910.42, "rew_std": 237.4632, "Agent": "NPG"}, {"env_step": 2611200, "rew": 930.35, "rew_std": 208.95, "Agent": "NPG"}, {"env_step": 2641920, "rew": 870.73, "rew_std": 259.4651, "Agent": "NPG"}, {"env_step": 2672640, "rew": 870.71, "rew_std": 259.5469, "Agent": "NPG"}, {"env_step": 2703360, "rew": 890.46, "rew_std": 229.0678, "Agent": "NPG"}, {"env_step": 2734080, "rew": 860.72, "rew_std": 282.1129, "Agent": "NPG"}, {"env_step": 2764800, "rew": 890.53, "rew_std": 220.0631, "Agent": "NPG"}, {"env_step": 2795520, "rew": 870.64, "rew_std": 267.1633, "Agent": "NPG"}, {"env_step": 2826240, "rew": 920.41, "rew_std": 165.3006, "Agent": "NPG"}, {"env_step": 2856960, "rew": 930.38, "rew_std": 140.9887, "Agent": "NPG"}, {"env_step": 2887680, "rew": 890.5, "rew_std": 268.7963, "Agent": "NPG"}, {"env_step": 2918400, "rew": 880.58, "rew_std": 242.9744, "Agent": "NPG"}, {"env_step": 2949120, "rew": 900.51, "rew_std": 198.98, "Agent": "NPG"}, {"env_step": 2979840, "rew": 910.45, "rew_std": 191.1802, "Agent": "NPG"}, {"env_step": 3010560, "rew": 930.38, "rew_std": 140.9958, "Agent": "NPG"}, {"env_step": 3041280, "rew": 930.65, "rew_std": 126.08, "Agent": "NPG"}, {"env_step": 3072000, "rew": 940.31, "rew_std": 119.38, "Agent": "NPG"}]