Fix: SamplingConfig.start_timesteps_random was not used

This commit is contained in:
Dominik Jain 2023-12-14 11:47:32 +01:00
parent ea48cc2989
commit 3caa3805f0

View File

@@ -115,7 +115,10 @@ class AgentFactory(ABC, ToStringMixin):
train_collector = Collector(policy, train_envs, buffer, exploration_noise=True)
test_collector = Collector(policy, envs.test_envs)
if self.sampling_config.start_timesteps > 0:
-train_collector.collect(n_step=self.sampling_config.start_timesteps, random=True)
+train_collector.collect(
+n_step=self.sampling_config.start_timesteps,
+random=self.sampling_config.start_timesteps_random,
+)
return train_collector, test_collector
def set_policy_wrapper_factory(