diff --git a/tianshou/optimizer/README.md b/tianshou/optimizer/README.md new file mode 100644 index 0000000..1b39f0d --- /dev/null +++ b/tianshou/optimizer/README.md @@ -0,0 +1,11 @@ +# Optimizers for policy gradient methods +TODO: +- vanilla policy gradient +- introduce a baseline +- REINFORCE +- TRPO +- PPO +- GAE +- NAF +- DPG +- ACKTR \ No newline at end of file