Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							c42990c725 
							
						 
					 
					
						
						
							
							add rllib result and fix pep8  
						
						
						
						
					 
					
						2020-03-28 09:43:35 +08:00 
						 
				 
			
				
					
						
							
							
								Minghao Zhang 
							
						 
					 
					
						
						
							
							
						
						
						
							
						
						
							77068af526 
							
						 
					 
					
						
						
							
							add examples, fix some bugs ( #5 )  
						
						... 
						
						
						
						* update atari.py
* fix setup.py
pass the pytest
* fix setup.py
pass the pytest
* add args "render"
* change the tensorboard writter
* change the tensorboard writter
* change device, render, tensorboard log location
* change device, render, tensorboard log location
* remove some wrong local files
* fix some tab mistakes and the envs name in continuous/test_xx.py
* add examples and point robot maze environment
* fix some bugs during testing examples
* add dqn network and fix some args
* change back the tensorboard writter's frequency to ensure ppo and a2c can write things normally
* add a warning to collector
* rm some unrelated files
* reformat
* fix a bug in test_dqn due to the model wrong selection 
						
						
					 
					
						2020-03-28 07:27:18 +08:00 
						 
				 
			
				
					
						
							
							
								sproblvem 
							
						 
					 
					
						
						
							
							
						
						
						
							
						
						
							acb93502cf 
							
						 
					 
					
						
						
							
							Update README.md  
						
						... 
						
						
						
						change "Framework" to "Task" 
						
						
					 
					
						2020-03-27 16:52:07 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							044aae4355 
							
						 
					 
					
						
						
							
							add baseline and rlpyt result  
						
						
						
						
					 
					
						2020-03-27 16:24:07 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							44f911bc31 
							
						 
					 
					
						
						
							
							add pytorch drl result  
						
						
						
						
					 
					
						2020-03-27 09:04:29 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							519f9f20d0 
							
						 
					 
					
						
						
							
							update readme  
						
						
						
						
					 
					
						2020-03-26 17:32:51 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							c505cd8205 
							
						 
					 
					
						
						
							
							update readme  
						
						
						
						
					 
					
						2020-03-26 11:42:34 +08:00 
						 
				 
			
				
					
						
							
							
								Minghao Zhang 
							
						 
					 
					
						
						
							
							
						
						
						
							
						
						
							3c0a09fefd 
							
						 
					 
					
						
						
							
							minor reformat ( #2 )  
						
						... 
						
						
						
						* update atari.py
* fix setup.py
pass the pytest
* fix setup.py
pass the pytest 
						
						
					 
					
						2020-03-26 09:01:20 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							fdc969b830 
							
						 
					 
					
						
						
							
							fix collector  
						
						
						
						
					 
					
						2020-03-25 14:08:28 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							e95218e295 
							
						 
					 
					
						
						
							
							sac  
						
						
						
						
					 
					
						2020-03-23 17:17:41 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							30a0fc079c 
							
						 
					 
					
						
						
							
							td3  
						
						
						
						
					 
					
						2020-03-23 11:34:52 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							a87563b8e6 
							
						 
					 
					
						
						
							
							add demo of ppo continuous action task  
						
						
						
						
					 
					
						2020-03-21 17:04:42 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							c173f7bfbc 
							
						 
					 
					
						
						
							
							fix ddpg  
						
						
						
						
					 
					
						2020-03-21 15:31:31 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							8bd8246b16 
							
						 
					 
					
						
						
							
							refract test code  
						
						
						
						
					 
					
						2020-03-21 10:58:01 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							d64d78d769 
							
						 
					 
					
						
						
							
							seed???  
						
						
						
						
					 
					
						2020-03-20 21:51:09 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							75364cd986 
							
						 
					 
					
						
						
							
							ppo and early stop  
						
						
						
						
					 
					
						2020-03-20 19:52:29 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							c87fe3c18c 
							
						 
					 
					
						
						
							
							add trainer  
						
						
						
						
					 
					
						2020-03-19 17:23:46 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							9c5417dd51 
							
						 
					 
					
						
						
							
							change env to vecenv for higher code coverage rate  
						
						
						
						
					 
					
						2020-03-18 21:56:03 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							64bab0b6a0 
							
						 
					 
					
						
						
							
							ddpg  
						
						
						
						
					 
					
						2020-03-18 21:45:41 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							6e563fe61a 
							
						 
					 
					
						
						
							
							a2c  
						
						
						
						
					 
					
						2020-03-17 20:22:37 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							fd621971e5 
							
						 
					 
					
						
						
							
							fix bug in test  
						
						
						
						
					 
					
						2020-03-17 15:16:30 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							39de63592f 
							
						 
					 
					
						
						
							
							finish pg  
						
						
						
						
					 
					
						2020-03-17 11:37:31 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							8b0b970c9b 
							
						 
					 
					
						
						
							
							add speed stat  
						
						
						
						
					 
					
						2020-03-16 15:04:58 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							cef5de8b83 
							
						 
					 
					
						
						
							
							fix some bugs  
						
						
						
						
					 
					
						2020-03-16 11:11:29 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							5983c6b33d 
							
						 
					 
					
						
						
							
							finish dqn  
						
						
						
						
					 
					
						2020-03-15 17:41:00 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							c804662457 
							
						 
					 
					
						
						
							
							add cache buf in collector  
						
						
						
						
					 
					
						2020-03-14 21:48:31 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							543e57cdbd 
							
						 
					 
					
						
						
							
							clear  
						
						
						
						
					 
					
						2020-03-13 21:47:17 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							f16e05c0e7 
							
						 
					 
					
						
						
							
							maybe finished collector?  
						
						
						
						
					 
					
						2020-03-13 17:49:22 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							f58c1397c6 
							
						 
					 
					
						
						
							
							half of collector  
						
						
						
						
					 
					
						2020-03-12 22:20:33 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							4a1a7dd670 
							
						 
					 
					
						
						
							
							fix a bug  
						
						
						
						
					 
					
						2020-03-11 18:02:19 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							6632e47b9d 
							
						 
					 
					
						
						
							
							add test_buffer  
						
						
						
						
					 
					
						2020-03-11 17:28:51 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							04557fdb82 
							
						 
					 
					
						
						
							
							env test \ ray  
						
						
						
						
					 
					
						2020-03-11 16:14:53 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							7533e5b0ac 
							
						 
					 
					
						
						
							
							add first test  
						
						
						
						
					 
					
						2020-03-11 10:56:38 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							5550aed0a1 
							
						 
					 
					
						
						
							
							flake8 fix  
						
						
						
						
					 
					
						2020-03-11 09:38:14 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							776acd9f13 
							
						 
					 
					
						
						
							
							github ci  
						
						
						
						
					 
					
						2020-03-11 09:18:28 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							0dfb900e29 
							
						 
					 
					
						
						
							
							env and data  
						
						
						
						
					 
					
						2020-03-11 09:09:56 +08:00 
						 
				 
			
				
					
						
							
							
								Trinkle23897 
							
						 
					 
					
						
						
						
						
							
						
						
							0c944eab68 
							
						 
					 
					
						
						
							
							init  
						
						
						
						
					 
					
						2020-03-09 11:38:04 +08:00