From e6cad0bce953da093cef5cf5a56ffac86bdb77d0 Mon Sep 17 00:00:00 2001 From: Tongzheng Ren Date: Mon, 6 Nov 2017 15:17:55 +0800 Subject: [PATCH] architecture design patch --- README.md | 25 +++++++++++++++++++++++++ tianshou/optimizer/README.md | 20 -------------------- 2 files changed, 25 insertions(+), 20 deletions(-) delete mode 100644 tianshou/optimizer/README.md diff --git a/README.md b/README.md index 3ccb5cb..883e965 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,27 @@ # tianshou Tianshou(天授) is a reinforcement learning platform. +## data +TODO: + +Replay Memory + +Multiple writer/reader + +Importance sampling + +## simulator +go (for AlphaGo) + +## environment +gym + +## core +TODO: + +Optimizer + +MCTS + +## agent (optional) + +DQNAgent etc. diff --git a/tianshou/optimizer/README.md b/tianshou/optimizer/README.md deleted file mode 100644 index e80c0d8..0000000 --- a/tianshou/optimizer/README.md +++ /dev/null @@ -1,20 +0,0 @@ -# Optimizer for policy gradient methods -TODO: - -vanilla - -baseline - -REINFORCE - -TRPO - -PPO - -GAE - -NAF - -DPG - -ACKTR \ No newline at end of file