212 B
212 B
network.managed_placeholders.keys()
data_collector.raw_data.keys()
data_collector.data.keys()
['observation']
['action']
['reward']
['done_flag']
['advantage'] > ['return']  # both keys may be present at the same time