NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							0eb66997fb
							
						
					 | 
					
						
						
							
							learnable initial state options for RSSM
						
						
						
						
						
						
					 | 
					
						2023-04-29 07:54:03 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							1328ff1088
							
						
					 | 
					
						
						
							
							sampling from the replay buffer across episodes
						
						
						
						
						
						
					 | 
					
						2023-04-29 07:43:02 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							12cccd8475
							
						
					 | 
					
						
						
							
							addition of "is_first" and "is_terminal" for envs
						
						
						
						
						
						
					 | 
					
						2023-04-29 07:34:27 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							3d0e2c8b5a
							
						
					 | 
					
						
						
							
							added .vscode to .gitignore
						
						
						
						
						
						
					 | 
					
						2023-04-29 07:30:34 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							2a8b44eb0c
							
						
					 | 
					
						
						
							
							erased unnecessary code
						
						
						
						
						
						
					 | 
					
						2023-04-27 07:42:08 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							432a359bcf
							
						
					 | 
					
						
						
							
							put running episode into replay buffer
						
						
						
						
						
						
					 | 
					
						2023-04-24 06:25:17 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							6f0e6c6963
							
						
					 | 
					
						
						
							
							applied formatter to envs
						
						
						
						
						
						
					 | 
					
						2023-04-23 22:52:30 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							628b856c63
							
						
					 | 
					
						
						
							
							changed the discount head to predict terminal
						
						
						
						
						
						
					 | 
					
						2023-04-22 09:34:23 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
							
							
						
						
						
							
						
						
							16151efb3c
							
						
					 | 
					
						
						
							
							Merge pull request #6 from truncs/main
						
						
						
						
						
						
						
						That is correct.
Thanks for your contribution! 
						
						
					 | 
					
						2023-04-22 09:19:44 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Aditya
							
						 
					 | 
					
						
						
						
						
							
						
						
							52782d31e3
							
						
					 | 
					
						
						
							
							terminal value is along the sequence dim
						
						
						
						
						
						
					 | 
					
						2023-04-20 19:05:18 -07:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							1e070a3daf
							
						
					 | 
					
						
						
							
							cleaned up envs
						
						
						
						
						
						
					 | 
					
						2023-04-15 23:16:43 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							fba87a33e0
							
						
					 | 
					
						
						
							
							applied formatter to tools
						
						
						
						
						
						
					 | 
					
						2023-04-15 15:28:09 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							55ed69bdf7
							
						
					 | 
					
						
						
							
							fix bug when using envs > 1
						
						
						
						
						
						
					 | 
					
						2023-04-15 15:25:25 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							cd935b7dd9
							
						
					 | 
					
						
						
							
							set default replay buffer size as 1M
						
						
						
						
						
						
					 | 
					
						2023-04-05 21:38:51 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							57ac1c11d3
							
						
					 | 
					
						
						
							
							replaced all tf function to torch
						
						
						
						
						
						
					 | 
					
						2023-04-03 08:06:34 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							8bd69bfcd4
							
						
					 | 
					
						
						
							
							bug fix when using multiple environments
						
						
						
						
						
						
					 | 
					
						2023-04-03 08:00:16 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							942eae10a9
							
						
					 | 
					
						
						
							
							updated result, requirements and torch version
						
						
						
						
						
						
					 | 
					
						2023-03-24 07:51:57 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							2504426164
							
						
					 | 
					
						
						
							
							updated results
						
						
						
						
						
						
					 | 
					
						2023-03-20 21:00:01 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							5ad0f6e9ca
							
						
					 | 
					
						
						
							
							clear eval episodes for saving memory
						
						
						
						
						
						
					 | 
					
						2023-03-20 20:55:06 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							44f8edc115
							
						
					 | 
					
						
						
							
							updated results
						
						
						
						
						
						
					 | 
					
						2023-03-18 19:07:12 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							6273444394
							
						
					 | 
					
						
						
							
							modified based on author's implementation
						
						
						
						
						
						
					 | 
					
						2023-03-18 08:38:23 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							a678a509b9
							
						
					 | 
					
						
						
							
							updated results
						
						
						
						
						
						
					 | 
					
						2023-02-18 14:42:22 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							f96ad071d1
							
						
					 | 
					
						
						
							
							modified network structures to match the paper
						
						
						
						
						
						
					 | 
					
						2023-02-18 10:13:02 +09:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								NM512
							
						 
					 | 
					
						
						
						
						
							
						
						
							fb5c21557a
							
						
					 | 
					
						
						
							
							Initial Commit
						
						
						
						
						
						
					 | 
					
						2023-02-12 22:35:25 +09:00 | 
					
					
						
						
							
							
							
						
					 |