| 
						
					 | 
					
						
						
						
						
							
						
						
							2e0f46b0f3
							
						
					 | 
					
						
						
							
							Fixing ser/deser bug (cloudpickle cant handle some enums)
						
						
						
						
						
					 | 
					
						2022-07-15 18:45:38 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							a86d19053d
							
						
					 | 
					
						
						
							
							Smashing bugs (dimension mismatch between Normal and
						
						
						
						
						
						
						
						Independent/MultivariateNormal) 
						
					 | 
					
						2022-07-15 15:46:31 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							ab557a8856
							
						
					 | 
					
						
						
							
							Making MultivariateNormal Policies work (and porting Normal to
						
						
						
						
						
						
						
						Independent) 
						
					 | 
					
						2022-07-15 15:03:51 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							b1ed9fc2b8
							
						
					 | 
					
						
						
							
							Renamed TRL_PG to PPO
						
						
						
						
						
					 | 
					
						2022-07-13 19:51:33 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							1706bea571
							
						
					 | 
					
						
						
							
							Testing SDC
						
						
						
						
						
					 | 
					
						2022-07-13 19:39:09 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							3304fd49f6
							
						
					 | 
					
						
						
							
							Working on UniversalGaussianDistribution
						
						
						
						
						
					 | 
					
						2022-07-13 19:38:57 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							fae19509bc
							
						
					 | 
					
						
						
							
							Implemented Policies with Contextual Covariance
						
						
						
						
						
					 | 
					
						2022-07-13 19:38:20 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							41e4170b2f
							
						
					 | 
					
						
						
							
							Fixes + spherical_chol
						
						
						
						
						
					 | 
					
						2022-07-11 17:28:08 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							e4440428f8
							
						
					 | 
					
						
						
							
							Working on SDC
						
						
						
						
						
					 | 
					
						2022-07-11 11:55:23 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							4c4b12ee0e
							
						
					 | 
					
						
						
							
							Allow cloning UniversalGaussianDistribution (new_dist_like)
						
						
						
						
						
					 | 
					
						2022-07-09 14:46:11 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							c08ea1cb91
							
						
					 | 
					
						
						
							
							Making UniversalGaussianDistribution ready for tanh-squashing-support
						
						
						
						
						
					 | 
					
						2022-07-09 14:33:07 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							249754ee89
							
						
					 | 
					
						
						
							
							Wrote a little helper-function to generate all allowed combinations of
						
						
						
						
						
						
						
						cov-parameterizations 
						
					 | 
					
						2022-07-09 14:03:56 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							e09950b30c
							
						
					 | 
					
						
						
							
							Work on Contextual Covariances
						
						
						
						
						
					 | 
					
						2022-07-09 12:26:39 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							aacacebfc4
							
						
					 | 
					
						
						
							
							Fixed license
						
						
						
						
						
					 | 
					
						2022-07-06 13:26:33 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							0911a04e98
							
						
					 | 
					
						
						
							
							Factored out Gaussian Collection for RolloutBuffer
						
						
						
						
						
					 | 
					
						2022-07-04 21:21:16 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							1f3eac5398
							
						
					 | 
					
						
						
							
							Cleanup
						
						
						
						
						
					 | 
					
						2022-07-02 16:42:14 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							92204c448f
							
						
					 | 
					
						
						
							
							Testing kl-projection (it's working!)
						
						
						
						
						
					 | 
					
						2022-07-02 16:41:25 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							ad7ed0071b
							
						
					 | 
					
						
						
							
							Silence!
						
						
						
						
						
					 | 
					
						2022-07-01 20:02:29 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							91f64c10d7
							
						
					 | 
					
						
						
							
							Fixed bug with initialization of buffer
						
						
						
						
						
					 | 
					
						2022-07-01 20:02:09 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							0dc9edf112
							
						
					 | 
					
						
						
							
							We no longer use venv (breaks cpp_projection...)
						
						
						
						
						
					 | 
					
						2022-07-01 19:52:22 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							14100cccc8
							
						
					 | 
					
						
						
							
							Working on SDC-impl.
						
						
						
						
						
					 | 
					
						2022-07-01 15:14:41 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							4f2e75b7ae
							
						
					 | 
					
						
						
							
							Slimmed 3rd-party-licenses
						
						
						
						
						
					 | 
					
						2022-07-01 14:03:50 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							90b3c68a56
							
						
					 | 
					
						
						
							
							Maybe better licensing
						
						
						
						
						
					 | 
					
						2022-07-01 13:59:07 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							cc51547681
							
						
					 | 
					
						
						
							
							Fixed CppProjection in requirements
						
						
						
						
						
					 | 
					
						2022-07-01 13:47:04 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							84d1cda96c
							
						
					 | 
					
						
						
							
							Trying to get kl to work
						
						
						
						
						
					 | 
					
						2022-07-01 13:45:58 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							9d7ce73a0b
							
						
					 | 
					
						
						
							
							README: We also have to install cpp_projection
						
						
						
						
						
					 | 
					
						2022-07-01 12:30:29 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							111b1b846d
							
						
					 | 
					
						
						
							
							Now we even include a setup.py
						
						
						
						
						
					 | 
					
						2022-07-01 12:22:27 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							81ae3e3707
							
						
					 | 
					
						
						
							
							Finalized venv support and added installation-instructions
						
						
						
						
						
					 | 
					
						2022-07-01 12:19:57 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							f25d7a103b
							
						
					 | 
					
						
						
							
							Now ready to pvenv
						
						
						
						
						
					 | 
					
						2022-07-01 12:03:20 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							2626ec82a6
							
						
					 | 
					
						
						
							
							Added code-src-note
						
						
						
						
						
					 | 
					
						2022-07-01 11:52:50 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							ab1b269af9
							
						
					 | 
					
						
						
							
							Allow checking whether a dist is contextual
						
						
						
						
						
					 | 
					
						2022-07-01 11:52:14 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							a8b9c63965
							
						
					 | 
					
						
						
							
							Making dez covariances contextual
						
						
						
						
						
					 | 
					
						2022-07-01 11:29:12 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							155a298e41
							
						
					 | 
					
						
						
							
							Switching to new icon
						
						
						
						
						
					 | 
					
						2022-06-30 21:02:22 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							7e7ba65e51
							
						
					 | 
					
						
						
							
							Testing alternative icon
						
						
						
						
						
					 | 
					
						2022-06-30 21:01:25 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							2e378d0a7d
							
						
					 | 
					
						
						
							
							Rebranding to Metastable Baselines
						
						
						
						
						
					 | 
					
						2022-06-30 20:40:30 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							30c9e93967
							
						
					 | 
					
						
						
							
							Fixed replay
						
						
						
						
						
					 | 
					
						2022-06-29 17:02:40 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							28561b9bb2
							
						
					 | 
					
						
						
							
							Allow manual early stopping of training (Ctrl+C)
						
						
						
						
						
					 | 
					
						2022-06-29 12:46:57 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							e8d423f91f
							
						
					 | 
					
						
						
							
							Testing the new WassersteinProjectionLayer
						
						
						
						
						
					 | 
					
						2022-06-29 12:46:37 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							4e77190d8e
							
						
					 | 
					
						
						
							
							Fixed chol not expanding bug and function to shrink chol to diag
						
						
						
						
						
					 | 
					
						2022-06-29 12:44:13 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							7c117cfca5
							
						
					 | 
					
						
						
							
							Added possibility to load models and run hem again (currently bugged)
						
						
						
						
						
					 | 
					
						2022-06-29 12:43:21 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							416dde202d
							
						
					 | 
					
						
						
							
							Factored out frob_sq and perf improvement for spd input
						
						
						
						
						
					 | 
					
						2022-06-27 13:44:08 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							f4c87c9cdc
							
						
					 | 
					
						
						
							
							Better handling of diagonal-covariance as vector and matrix
						
						
						
						
						
					 | 
					
						2022-06-26 18:14:12 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							bc61a6db32
							
						
					 | 
					
						
						
							
							Refactored some stuff out
						
						
						
						
						
					 | 
					
						2022-06-26 16:39:37 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							edf00553dd
							
						
					 | 
					
						
						
							
							Renamed our RolloutBuffer and testing the FrobeniusProjectionLayer
						
						
						
						
						
					 | 
					
						2022-06-26 16:39:06 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							024a9a0265
							
						
					 | 
					
						
						
							
							StillTesting
						
						
						
						
						
					 | 
					
						2022-06-26 16:38:46 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							80741776d2
							
						
					 | 
					
						
						
							
							Removed old comments
						
						
						
						
						
					 | 
					
						2022-06-25 21:56:07 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							b8488c531b
							
						
					 | 
					
						
						
							
							Implemented TRLRolloutBuffer
						
						
						
						
						
					 | 
					
						2022-06-25 21:47:39 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							60c954c8c1
							
						
					 | 
					
						
						
							
							LunarLanderContinuous-v2 is our new default test-env
						
						
						
						
						
					 | 
					
						2022-06-25 21:47:21 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							cf5a2e82fc
							
						
					 | 
					
						
						
							
							mean and std are now saved to the rollout
						
						
						
						
						
					 | 
					
						2022-06-25 18:29:55 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
						
						
							
						
						
							df21e1dc3f
							
						
					 | 
					
						
						
							
							Fixed reference to gym.spaces
						
						
						
						
						
					 | 
					
						2022-06-25 17:49:46 +02:00 | 
					
					
						
						
							
							
							
						
					 |