from __future__ import absolute_import


def test_policy_in_env(policy, env):
    """Unfinished stub; presumably meant to run ``policy`` inside ``env``.

    As written, the function only binds a second local name to ``env`` and
    returns ``None``. ``policy`` is never read.

    Args:
        policy: Not used by the current body.
        env: Environment object; only re-bound to a local name.

    Returns:
        None.
    """
    # The original env is used for training data collection, so a separate
    # one is wanted here.
    # NOTE(review): this is a plain alias of the same object, not a new
    # env -- confirm whether a copy or a fresh instance was intended.
    eval_env = env
    return None