2022-04-24 20:44:54 +08:00

1 line
59 KiB
JSON

[{"env_step": 0, "rew": -20.979999923706053, "rew_std": 0.04000015258789063, "Agent": "c51"}, {"env_step": 100000, "rew": -20.869999885559082, "rew_std": 0.15524167570244413, "Agent": "c51"}, {"env_step": 200000, "rew": -20.560000038146974, "rew_std": 0.40298883737879937, "Agent": "c51"}, {"env_step": 300000, "rew": -18.95999994277954, "rew_std": 2.2632720366854833, "Agent": "c51"}, {"env_step": 400000, "rew": -16.210000228881835, "rew_std": 2.7750494802377017, "Agent": "c51"}, {"env_step": 500000, "rew": -15.040000057220459, "rew_std": 3.022648038181074, "Agent": "c51"}, {"env_step": 600000, "rew": -12.759999966621399, "rew_std": 5.666603835995492, "Agent": "c51"}, {"env_step": 700000, "rew": -8.17000013589859, "rew_std": 6.876634371998414, "Agent": "c51"}, {"env_step": 800000, "rew": -5.910000105202198, "rew_std": 5.658347880641881, "Agent": "c51"}, {"env_step": 900000, "rew": -2.0299999713897705, "rew_std": 7.5090678214603175, "Agent": "c51"}, {"env_step": 1000000, "rew": -1.05, "rew_std": 8.06576073888153, "Agent": "c51"}, {"env_step": 1100000, "rew": 5.750000011920929, "rew_std": 8.470448577145289, "Agent": "c51"}, {"env_step": 1200000, "rew": 11.85, "rew_std": 6.486486065226738, "Agent": "c51"}, {"env_step": 1300000, "rew": 11.839999842643739, "rew_std": 9.283232047765221, "Agent": "c51"}, {"env_step": 1400000, "rew": 10.289999675750732, "rew_std": 13.408239764024396, "Agent": "c51"}, {"env_step": 1500000, "rew": 15.300000054495674, "rew_std": 7.003264581462973, "Agent": "c51"}, {"env_step": 1600000, "rew": 15.419999885559083, "rew_std": 5.896914245313163, "Agent": "c51"}, {"env_step": 1700000, "rew": 16.47999973297119, "rew_std": 6.142116861407374, "Agent": "c51"}, {"env_step": 1800000, "rew": 18.700000381469728, "rew_std": 1.2743627474105064, "Agent": "c51"}, {"env_step": 1900000, "rew": 13.000000283122063, "rew_std": 8.335466556491935, "Agent": "c51"}, {"env_step": 2000000, "rew": 17.47499966621399, "rew_std": 3.660174086617874, "Agent": "c51"}, {"env_step": 2100000, "rew": 13.566666801770529, "rew_std": 8.47833851940157, "Agent": "c51"}, {"env_step": 2200000, "rew": 19.75, "rew_std": 0.5499992370605469, "Agent": "c51"}, {"env_step": 2300000, "rew": 14.0, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 2400000, "rew": 19.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 2500000, "rew": 15.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 2600000, "rew": 18.200000762939453, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 2700000, "rew": 19.0, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 2800000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 2900000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3000000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3100000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3200000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3300000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3400000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3500000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3600000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3700000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3800000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 3900000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4000000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4100000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4200000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4300000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4400000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4500000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4600000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4700000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4800000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 4900000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5000000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5100000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5200000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5300000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5400000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5500000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5600000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5700000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5800000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 5900000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6000000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6100000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6200000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6300000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6400000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6500000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6600000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6700000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6800000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 6900000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7000000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7100000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7200000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7300000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7400000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7500000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7600000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7700000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7800000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 7900000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8000000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8100000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8200000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8300000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8400000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8500000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8600000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8700000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8800000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 8900000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9000000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9100000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9200000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9300000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9400000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9500000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9600000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9700000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9800000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 9900000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 10000000, "rew": 20.600000381469727, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 0, "rew": -20.979999923706053, "rew_std": 0.04000015258789063, "Agent": "dqn"}, {"env_step": 100000, "rew": -20.689999961853026, "rew_std": 0.5281095979692643, "Agent": "dqn"}, {"env_step": 200000, "rew": -18.38000020980835, "rew_std": 2.5906757312772744, "Agent": "dqn"}, {"env_step": 300000, "rew": -18.030000019073487, "rew_std": 1.7245580854624265, "Agent": "dqn"}, {"env_step": 400000, "rew": -13.899999952316284, "rew_std": 3.808936970212056, "Agent": "dqn"}, {"env_step": 500000, "rew": -5.709999942779541, "rew_std": 9.006936246078585, "Agent": "dqn"}, {"env_step": 600000, "rew": -1.0700000286102296, "rew_std": 8.908540906843577, "Agent": "dqn"}, {"env_step": 700000, "rew": 6.160000026226044, "rew_std": 7.3988107178341656, "Agent": "dqn"}, {"env_step": 800000, "rew": 15.04000015258789, "rew_std": 5.2547504042740645, "Agent": "dqn"}, {"env_step": 900000, "rew": 19.755555470784504, "rew_std": 0.4374447957623508, "Agent": "dqn"}, {"env_step": 1000000, "rew": 19.983332951863606, "rew_std": 0.5814256919850659, "Agent": "dqn"}, {"env_step": 1100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 1200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 1300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 1400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 1500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 1600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 1700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 1800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 1900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 2900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 3900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 4900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 5900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 6900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 7900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 8900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9100000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9200000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9300000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9400000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9500000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9600000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9700000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9800000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 9900000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 10000000, "rew": 20.25, "rew_std": 0.25, "Agent": "dqn"}, {"env_step": 0, "rew": -20.979999923706053, "rew_std": 0.04000015258789063, "Agent": "fqf"}, {"env_step": 100000, "rew": -20.879999923706055, "rew_std": 0.15999994277996732, "Agent": "fqf"}, {"env_step": 200000, "rew": -19.329999923706055, "rew_std": 1.1883183401767072, "Agent": "fqf"}, {"env_step": 300000, "rew": -18.410000228881835, "rew_std": 2.3947650818103883, "Agent": "fqf"}, {"env_step": 400000, "rew": -15.789999866485596, "rew_std": 1.8124292335112842, "Agent": "fqf"}, {"env_step": 500000, "rew": -12.899999952316284, "rew_std": 3.9191835397861126, "Agent": "fqf"}, {"env_step": 600000, "rew": -7.259999930858612, "rew_std": 6.181294202818166, "Agent": "fqf"}, {"env_step": 700000, "rew": -0.2800000667572021, "rew_std": 5.578135949422739, "Agent": "fqf"}, {"env_step": 800000, "rew": 5.889999827742576, "rew_std": 6.357428520171511, "Agent": "fqf"}, {"env_step": 900000, "rew": 12.8555555873447, "rew_std": 5.842585252592779, "Agent": "fqf"}, {"env_step": 1000000, "rew": 18.875, "rew_std": 2.6085196695608577, "Agent": "fqf"}, {"env_step": 1100000, "rew": 18.749999682108562, "rew_std": 2.6196374340932294, "Agent": "fqf"}, {"env_step": 1200000, "rew": 19.65999984741211, "rew_std": 1.051855243717263, "Agent": "fqf"}, {"env_step": 1300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 1400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 1500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 1600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 1700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 1800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 1900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2100000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2200000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 2900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3100000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3200000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 3900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4100000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4200000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 4900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5100000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5200000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 5900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6100000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6200000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 6900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7100000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7200000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 7900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8100000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8200000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 8900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9100000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9200000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9300000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9400000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9500000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9600000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9700000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9800000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 9900000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 10000000, "rew": 20.399999618530273, "rew_std": 0.39999961853027344, "Agent": "fqf"}, {"env_step": 0, "rew": -21.0, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 100000, "rew": -20.870000076293945, "rew_std": 0.27221299202092436, "Agent": "qrdqn"}, {"env_step": 200000, "rew": -19.48000011444092, "rew_std": 1.2023307411527404, "Agent": "qrdqn"}, {"env_step": 300000, "rew": -16.780000019073487, "rew_std": 2.1613883342785347, "Agent": "qrdqn"}, {"env_step": 400000, "rew": -12.920000219345093, "rew_std": 3.473845164617662, "Agent": "qrdqn"}, {"env_step": 500000, "rew": -7.060000002384186, "rew_std": 6.094456461922503, "Agent": "qrdqn"}, {"env_step": 600000, "rew": -3.779999941587448, "rew_std": 6.045295632144355, "Agent": "qrdqn"}, {"env_step": 700000, "rew": 9.749999952316283, "rew_std": 6.640368991575429, "Agent": "qrdqn"}, {"env_step": 800000, "rew": 15.269999933242797, "rew_std": 4.12966090763813, "Agent": "qrdqn"}, {"env_step": 900000, "rew": 19.622222052680122, "rew_std": 1.2916639583656102, "Agent": "qrdqn"}, {"env_step": 1000000, "rew": 20.09999990463257, "rew_std": 0.3162274644388989, "Agent": "qrdqn"}, {"env_step": 1100000, "rew": 19.899999618530273, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 1200000, "rew": 19.899999618530273, "rew_std": 0.10000038146972656, "Agent": "qrdqn"}, {"env_step": 1300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 1400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 1500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 1600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 1700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 1800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 1900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 2900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 3900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 4900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 5900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 6900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 7900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 8900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 9900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 10000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "qrdqn"}, {"env_step": 0, "rew": -20.969999885559083, "rew_std": 0.06403148663413369, "Agent": "iqn"}, {"env_step": 100000, "rew": -19.1300000667572, "rew_std": 5.345100609195572, "Agent": "iqn"}, {"env_step": 200000, "rew": -19.34000015258789, "rew_std": 1.09380072496787, "Agent": "iqn"}, {"env_step": 300000, "rew": -18.3, "rew_std": 1.1471704685545094, "Agent": "iqn"}, {"env_step": 400000, "rew": -14.660000038146972, "rew_std": 2.7383207958984883, "Agent": "iqn"}, {"env_step": 500000, "rew": -9.659999978542327, "rew_std": 5.29871682181189, "Agent": "iqn"}, {"env_step": 600000, "rew": -8.680000057816505, "rew_std": 4.040495106986447, "Agent": "iqn"}, {"env_step": 700000, "rew": 2.8499999545514583, "rew_std": 6.374519581488704, "Agent": "iqn"}, {"env_step": 800000, "rew": 7.970000147819519, "rew_std": 8.160275826601659, "Agent": "iqn"}, {"env_step": 900000, "rew": 17.166666507720947, "rew_std": 4.651164654639624, "Agent": "iqn"}, {"env_step": 1000000, "rew": 17.849999984105427, "rew_std": 4.5853935091484725, "Agent": "iqn"}, {"env_step": 1100000, "rew": 18.260000038146973, "rew_std": 1.9652988864635694, "Agent": "iqn"}, {"env_step": 1200000, "rew": 18.68000030517578, "rew_std": 2.9047550585330666, "Agent": "iqn"}, {"env_step": 1300000, "rew": 19.600000381469727, "rew_std": 0.39999961853027344, "Agent": "iqn"}, {"env_step": 1400000, "rew": 18.799999237060547, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 1500000, "rew": 17.0, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 1600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 1700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 1800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 1900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 2900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 3900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 4900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 5900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 6900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 7900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 8900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9100000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9200000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9300000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9400000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9500000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9600000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9700000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9800000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 9900000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 10000000, "rew": 20.700000762939453, "rew_std": 0.0, "Agent": "iqn"}, {"env_step": 0, "rew": -21.0, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 100000, "rew": -20.979999923706053, "rew_std": 0.04000015258789063, "Agent": "rainbow"}, {"env_step": 200000, "rew": -20.439999961853026, "rew_std": 0.611882543624649, "Agent": "rainbow"}, {"env_step": 300000, "rew": -20.05, "rew_std": 1.0984076053899456, "Agent": "rainbow"}, {"env_step": 400000, "rew": -18.579999923706055, "rew_std": 1.1417527594487265, "Agent": "rainbow"}, {"env_step": 500000, "rew": -16.669999980926512, "rew_std": 2.142918529337897, "Agent": "rainbow"}, {"env_step": 600000, "rew": -14.539999961853027, "rew_std": 3.4153184124021854, "Agent": "rainbow"}, {"env_step": 700000, "rew": -11.319999885559081, "rew_std": 2.876734170162213, "Agent": "rainbow"}, {"env_step": 800000, "rew": -10.470000064373016, "rew_std": 4.46520999148195, "Agent": "rainbow"}, {"env_step": 900000, "rew": -2.170000058412552, "rew_std": 4.194055360234164, "Agent": "rainbow"}, {"env_step": 1000000, "rew": -1.1700000524520875, "rew_std": 7.9131599288409395, "Agent": "rainbow"}, {"env_step": 1100000, "rew": 4.420000007003546, "rew_std": 8.925671038750298, "Agent": "rainbow"}, {"env_step": 1200000, "rew": 4.199999978972806, "rew_std": 7.79358685682886, "Agent": "rainbow"}, {"env_step": 1300000, "rew": 4.3666667805777655, "rew_std": 9.006787650672438, "Agent": "rainbow"}, {"env_step": 1400000, "rew": 8.224999904632568, "rew_std": 5.813507857159169, "Agent": "rainbow"}, {"env_step": 1500000, "rew": 10.48749989271164, "rew_std": 5.611915177475383, "Agent": "rainbow"}, {"env_step": 1600000, "rew": 10.325000084936619, "rew_std": 7.195441264466608, "Agent": "rainbow"}, {"env_step": 1700000, "rew": 5.216666638851166, "rew_std": 8.010496691447514, "Agent": "rainbow"}, {"env_step": 1800000, "rew": 7.8833333651224775, "rew_std": 8.73506665798113, "Agent": "rainbow"}, {"env_step": 1900000, "rew": 10.416666527589163, "rew_std": 7.064799091845216, "Agent": "rainbow"}, {"env_step": 2000000, "rew": 14.739999961853027, "rew_std": 3.559550394534507, "Agent": "rainbow"}, {"env_step": 2100000, "rew": 16.82000026702881, "rew_std": 2.790985522657408, "Agent": "rainbow"}, {"env_step": 2200000, "rew": 14.699999809265137, "rew_std": 3.199374665910315, "Agent": "rainbow"}, {"env_step": 2300000, "rew": 16.800000190734863, "rew_std": 1.987460835388907, "Agent": "rainbow"}, {"env_step": 2400000, "rew": 16.649999856948853, "rew_std": 3.9150350231246187, "Agent": "rainbow"}, {"env_step": 2500000, "rew": 18.700000127156574, "rew_std": 1.8384774512584698, "Agent": "rainbow"}, {"env_step": 2600000, "rew": 9.5, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 2700000, "rew": 16.100000381469727, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 2800000, "rew": 15.5, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 2900000, "rew": 15.600000381469727, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3000000, "rew": -4.300000190734863, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3100000, "rew": 17.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3200000, "rew": 17.799999237060547, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3300000, "rew": 19.100000381469727, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3400000, "rew": 19.5, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3500000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3600000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3700000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3800000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 3900000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4000000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4100000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4200000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4300000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4400000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4500000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4600000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4700000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4800000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 4900000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5000000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5100000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5200000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5300000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5400000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5500000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5600000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5700000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5800000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 5900000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6000000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6100000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6200000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6300000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6400000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6500000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6600000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6700000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6800000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 6900000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7000000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7100000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7200000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7300000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7400000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7500000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7600000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7700000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7800000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 7900000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8000000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8100000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8200000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8300000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8400000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8500000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8600000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8700000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8800000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 8900000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9000000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9100000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9200000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9300000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9400000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9500000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9600000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9700000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9800000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 9900000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 10000000, "rew": 20.200000762939453, "rew_std": 0.0, "Agent": "rainbow"}, {"env_step": 0, "rew": -20.75, "rew_std": 0.34132100802270626, "Agent": "ppo"}, {"env_step": 100000, "rew": -20.61000003814697, "rew_std": 0.32695557164785227, "Agent": "ppo"}, {"env_step": 200000, "rew": -19.98000011444092, "rew_std": 0.5793098790055098, "Agent": "ppo"}, {"env_step": 300000, "rew": -17.55, "rew_std": 2.648112510163754, "Agent": "ppo"}, {"env_step": 400000, "rew": -13.260000038146973, "rew_std": 4.553284472142394, "Agent": "ppo"}, {"env_step": 500000, "rew": -9.600000047683716, "rew_std": 5.175519361004068, "Agent": "ppo"}, {"env_step": 600000, "rew": -8.650000131130218, "rew_std": 5.414471552623239, "Agent": "ppo"}, {"env_step": 700000, "rew": -4.4400000154972075, "rew_std": 5.544041881025165, "Agent": "ppo"}, {"env_step": 800000, "rew": 0.6799999058246613, "rew_std": 7.877410761852243, "Agent": "ppo"}, {"env_step": 900000, "rew": 5.640000033378601, "rew_std": 6.771735266186935, "Agent": "ppo"}, {"env_step": 1000000, "rew": 5.6600001603364944, "rew_std": 7.132489235026172, "Agent": "ppo"}, {"env_step": 1100000, "rew": 6.7699999690055845, "rew_std": 6.8543488111854005, "Agent": "ppo"}, {"env_step": 1200000, "rew": 11.959999895095825, "rew_std": 4.759663803505452, "Agent": "ppo"}, {"env_step": 1300000, "rew": 13.499999952316283, "rew_std": 4.599999950243093, "Agent": "ppo"}, {"env_step": 1400000, "rew": 13.460000038146973, "rew_std": 4.538986609617991, "Agent": "ppo"}, {"env_step": 1500000, "rew": 13.359999942779542, "rew_std": 4.740295478528203, "Agent": "ppo"}, {"env_step": 1600000, "rew": 15.47999997138977, "rew_std": 3.309924420995019, "Agent": "ppo"}, {"env_step": 1700000, "rew": 13.88000020980835, "rew_std": 3.9776378782724717, "Agent": "ppo"}, {"env_step": 1800000, "rew": 16.680000019073486, "rew_std": 2.098475869175282, "Agent": "ppo"}, {"env_step": 1900000, "rew": 15.039999866485596, "rew_std": 3.2720634721834996, "Agent": "ppo"}, {"env_step": 2000000, "rew": 16.200000190734862, "rew_std": 2.0079841339730997, "Agent": "ppo"}, {"env_step": 2100000, "rew": 16.709999752044677, "rew_std": 2.592083999305904, "Agent": "ppo"}, {"env_step": 2200000, "rew": 17.93000011444092, "rew_std": 1.5020321173047337, "Agent": "ppo"}, {"env_step": 2300000, "rew": 16.13333299424913, "rew_std": 4.134945780702597, "Agent": "ppo"}, {"env_step": 2400000, "rew": 16.46666653951009, "rew_std": 2.9988884554980983, "Agent": "ppo"}, {"env_step": 2500000, "rew": 17.266666624281143, "rew_std": 1.7549928259554646, "Agent": "ppo"}, {"env_step": 2600000, "rew": 17.63333363003201, "rew_std": 1.300427226972741, "Agent": "ppo"}, {"env_step": 2700000, "rew": 16.8111113442315, "rew_std": 2.6534861585374485, "Agent": "ppo"}, {"env_step": 2800000, "rew": 17.000000211927627, "rew_std": 2.82999802642146, "Agent": "ppo"}, {"env_step": 2900000, "rew": 16.97777779897054, "rew_std": 2.5494127247858547, "Agent": "ppo"}, {"env_step": 3000000, "rew": 17.81250011920929, "rew_std": 1.6593954848338575, "Agent": "ppo"}, {"env_step": 3100000, "rew": 17.06250011920929, "rew_std": 2.284697851779331, "Agent": "ppo"}, {"env_step": 3200000, "rew": 16.975000381469727, "rew_std": 2.1057958062253594, "Agent": "ppo"}, {"env_step": 3300000, "rew": 16.824999809265137, "rew_std": 2.9625790227338165, "Agent": "ppo"}, {"env_step": 3400000, "rew": 18.1875, "rew_std": 2.531519990815377, "Agent": "ppo"}, {"env_step": 3500000, "rew": 16.71666669845581, "rew_std": 2.412755415928967, "Agent": "ppo"}, {"env_step": 3600000, "rew": 16.46666669845581, "rew_std": 3.901566607031345, "Agent": "ppo"}, {"env_step": 3700000, "rew": 16.166666666666668, "rew_std": 2.739626889190835, "Agent": "ppo"}, {"env_step": 3800000, "rew": 17.300000190734863, "rew_std": 2.78926494928614, "Agent": "ppo"}, {"env_step": 3900000, "rew": 18.09999990463257, "rew_std": 2.077658824212887, "Agent": "ppo"}, {"env_step": 4000000, "rew": 17.019999504089355, "rew_std": 1.4483091764261082, "Agent": "ppo"}, {"env_step": 4100000, "rew": 18.620000076293945, "rew_std": 1.2253983415940415, "Agent": "ppo"}, {"env_step": 4200000, "rew": 18.35999984741211, "rew_std": 2.2526428387365733, "Agent": "ppo"}, {"env_step": 4300000, "rew": 19.0, "rew_std": 0.6519197285159748, "Agent": "ppo"}, {"env_step": 4400000, "rew": 18.975000381469727, "rew_std": 1.3141059206073868, "Agent": "ppo"}, {"env_step": 4500000, "rew": 19.625, "rew_std": 0.3897113582892007, "Agent": "ppo"}, {"env_step": 4600000, "rew": 19.566666920979817, "rew_std": 0.684754539003982, "Agent": "ppo"}, {"env_step": 4700000, "rew": 15.199999809265137, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 4800000, "rew": 17.200000762939453, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 4900000, "rew": 16.799999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5000000, "rew": 18.700000762939453, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5100000, "rew": 16.100000381469727, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5200000, "rew": 17.700000762939453, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5300000, "rew": 17.700000762939453, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5400000, "rew": 17.600000381469727, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5500000, "rew": 16.700000762939453, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5600000, "rew": 19.399999618530273, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5700000, "rew": 19.100000381469727, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5800000, "rew": 18.5, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 5900000, "rew": 18.700000762939453, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6000000, "rew": 19.600000381469727, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6100000, "rew": 19.0, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6200000, "rew": 19.0, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6300000, "rew": 19.100000381469727, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6400000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6500000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6600000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6700000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6800000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 6900000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7000000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7100000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7200000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7300000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7400000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7500000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7600000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7700000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7800000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 7900000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8000000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8100000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8200000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8300000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8400000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8500000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8600000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8700000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8800000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 8900000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9000000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9100000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9200000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9300000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9400000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9500000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9600000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9700000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9800000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 9900000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}, {"env_step": 10000000, "rew": 20.299999237060547, "rew_std": 0.0, "Agent": "ppo"}]