diff --git a/tianshou/core/README.md b/tianshou/core/README.md new file mode 100644 index 0000000..2ef89eb --- /dev/null +++ b/tianshou/core/README.md @@ -0,0 +1,24 @@ +# Core + +## Optimizer +TODO: + +### policy-based: + +Vanilla + +Baseline + +TRPO + +PPO + +NAF + +GAE + +DPG + +### value-based: + +TD diff --git a/tianshou/optimizer/README.md b/tianshou/optimizer/README.md index 31775ae..e80c0d8 100644 --- a/tianshou/optimizer/README.md +++ b/tianshou/optimizer/README.md @@ -1,11 +1,20 @@ # Optimizer for policy gradient methods TODO: + vanilla -introduce a baseline + +baseline + REINFORCE + TRPO + PPO + GAE + NAF + DPG -ACKTR \ No newline at end of file + +ACKTR \ No newline at end of file