213 B
213 B
network.managed_placeholders.keys()
data_collector.raw_data.keys()
data_collector.data.keys()
['observation']
['action']
['reward']
['start_flag']
['advantage'] > ['return'] # both keys may be present at the same time; '>' means 'advantage' takes precedence over 'return'