| 
									
										
										
										
											2020-03-18 21:45:41 +08:00
										 |  |  | import numpy as np | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class OUNoise(object): | 
					
						
							| 
									
										
										
										
											2020-04-05 18:34:45 +08:00
										 |  |  |     """Class for Ornstein-Uhlenbeck process, as used for exploration in DDPG.
 | 
					
						
							| 
									
										
										
										
											2020-04-03 21:28:12 +08:00
										 |  |  |     Usage: | 
					
						
							|  |  |  |     :: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         # init | 
					
						
							|  |  |  |         self.noise = OUNoise() | 
					
						
							|  |  |  |         # generate noise | 
					
						
							|  |  |  |         noise = self.noise(logits.shape, eps) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     For required parameters, you can refer to the stackoverflow page. However, | 
					
						
							|  |  |  |     our experiment result shows that (similar to OpenAI SpinningUp) using | 
					
						
							|  |  |  |     vanilla gaussian process has little difference from using the | 
					
						
							|  |  |  |     Ornstein-Uhlenbeck process. | 
					
						
							|  |  |  |     """
 | 
					
						
							| 
									
										
										
										
											2020-03-18 21:45:41 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def __init__(self, sigma=0.3, theta=0.15, dt=1e-2, x0=None): | 
					
						
							|  |  |  |         self.alpha = theta * dt | 
					
						
							|  |  |  |         self.beta = sigma * np.sqrt(dt) | 
					
						
							|  |  |  |         self.x0 = x0 | 
					
						
							|  |  |  |         self.reset() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def __call__(self, size, mu=.1): | 
					
						
							| 
									
										
										
										
											2020-04-05 18:34:45 +08:00
										 |  |  |         """Generate new noise. Return a ``numpy.ndarray`` which size is equal
 | 
					
						
							|  |  |  |         to ``size``. | 
					
						
							| 
									
										
										
										
											2020-04-03 21:28:12 +08:00
										 |  |  |         """
 | 
					
						
							| 
									
										
										
										
											2020-03-18 21:45:41 +08:00
										 |  |  |         if self.x is None or self.x.shape != size: | 
					
						
							|  |  |  |             self.x = 0 | 
					
						
							| 
									
										
										
										
											2020-03-28 09:43:35 +08:00
										 |  |  |         r = self.beta * np.random.normal(size=size) | 
					
						
							|  |  |  |         self.x = self.x + self.alpha * (mu - self.x) + r | 
					
						
							| 
									
										
										
										
											2020-03-18 21:45:41 +08:00
										 |  |  |         return self.x | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def reset(self): | 
					
						
							| 
									
										
										
										
											2020-04-05 18:34:45 +08:00
										 |  |  |         """Reset to the initial state.""" | 
					
						
							| 
									
										
										
										
											2020-03-18 21:45:41 +08:00
										 |  |  |         self.x = None |