fix dqn zero eps (#52)

Co-authored-by: liyan <liyan1@digisky.com>
2020-05-21 11:35:41 +08:00 · 2020-05-21 11:35:41 +08:00 · 6237cc0d52
commit 6237cc0d52
parent 57bca16f94
1 changed file with 4 additions and 3 deletions
--- a/tianshou/policy/modelfree/dqn.py
+++ b/tianshou/policy/modelfree/dqn.py
@@ -150,9 +150,10 @@ class DQNPolicy(BasePolicy):
        # add eps to act
        if eps is None:
            eps = self.eps
-        for i in range(len(q)):
+        if not np.isclose(eps, 0):
-            if np.random.rand() < eps:
+            for i in range(len(q)):
-                act[i] = np.random.randint(q.shape[1])
+                if np.random.rand() < eps:
+                    act[i] = np.random.randint(q.shape[1])
        return Batch(logits=q, act=act, state=h)
    def learn(self, batch: Batch, **kwargs) -> Dict[str, float]: