saicpp commited on
Commit
c148c08
·
verified ·
1 Parent(s): d37c834

Finished v6 of model of unit 1

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 231.51 +/- 51.08
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 268.48 +/- 21.87
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7a8e71966d40>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a8e71966dd0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a8e71966e60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a8e71966ef0>", "_build": "<function ActorCriticPolicy._build at 0x7a8e71966f80>", "forward": "<function ActorCriticPolicy.forward at 0x7a8e71967010>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a8e719670a0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a8e71967130>", "_predict": "<function ActorCriticPolicy._predict at 0x7a8e719671c0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a8e71967250>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a8e719672e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a8e71967370>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7a8e72290180>"}, "verbose": 0, "policy_kwargs": {}, "num_timesteps": 131072, "_total_timesteps": 100000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1724931803726300587, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": null, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.3107200000000001, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCihxgiNbWMAWyUTRUBjAF0lEdAnT30BXCCSXV9lChoBkdAcYvZKFqSHWgHTREBaAhHQJ0/JT6zmfZ1fZQoaAZHQHCJrX+VC5VoB00NAWgIR0CdPyVzp5eJdX2UKGgGR0BuimbqhUR4aAdL+GgIR0CdQbgGbCrMdX2UKGgGR0BguNiONo8IaAdN6ANoCEdAnUHwzUI9knV9lChoBkdAb/oukk8ifWgHS+hoCEdAnULHa8Hv+nV9lChoBkdAcNzHiFTNuGgHTacBaAhHQJ1Dpk+X7ch1fZQoaAZHQDjZ3GGVRk5oB0vpaAhHQJ1FpJf6XSl1fZQoaAZHQGJ2mZmZmZpoB03oA2gIR0CdRssqril0dX2UKGgGR0BicicEvCdjaAdN6ANoCEdAnUmPUWl/IHV9lChoBkdAR8rHn2ZiNWgHS9hoCEdAnUmv3FkxynV9lChoBkdAcjhm3OObRWgHS/NoCEdAnUmxFuvU0HV9lChoBkdAbzFQTmGM42gHTQkCaAhHQJ1PWdRR/Ex1fZQoaAZHQGzTGnn+yZ9oB02rAWgIR0CdUBHmig01dX2UKGgGR0BxGb7+DOC5aAdNFAFoCEdAnVJAPiDM/3V9lChoBkdAcgPenAIppmgHTQwBaAhHQJ1SxuGbkOt1fZQoaAZHQHHLJwn6VMVoB00SAWgIR0CdVSLdN34cdX2UKGgGR8BJoXZXdTHbaAdL12gIR0CdVWAgPmPpdX2UKGgGR0BuDJ2r4nF6aAdL+WgIR0CdVvdTo+wDdX2UKGgGR0BxVzmeUY8/aAdNBwFoCEdAnVeSGnGbTnV9lChoBkdAZgd+jM3ZPGgHTegDaAhHQJ1Xp+w1R+B1fZQoaAZHQG+pIhQm/nJoB0v6aAhHQJ1a8SL61st1fZQoaAZHQHFB6QRwqAloB0vlaAhHQJ1c2WLP2PF1fZQoaAZHQF+KG8274BVoB03oA2gIR0CdXYMfA9FGdX2UKGgGR0BwSTgLqlguaAdNCwFoCEdAnV4F0YCQtHV9lChoBkdAb8Xzp5eJHmgHTdMBaAhHQJ1eeP5pJwt1fZQoaAZHQHGbQp8WsRxoB0vkaAhHQJ1fBouf29N1fZQoaAZHQHDjYKhL5ARoB01gAWgIR0CdX8fiPyTZdX2UKGgGR0BvLDU3GXHBaAdL82gIR0CdX9GgzxgBdX2UKGgGR0BwZrd2xIJ7aAdNCgFoCEdAnWKtLlFMI3V9lChoBkdAcMy6eGwiaGgHTRMBaAhHQJ1jGdUbT+h1fZQoaAZHQGAbQUHpr1xoB03oA2gIR0CdZgLPldTpdX2UKGgGR0BFTYkVvddnaAdL1mgIR0CdZjmdiDujdX2UKGgGR0ByMwOLBKtgaAdNEwFoCEdAnWZ1oUSIxnV9lChoBkdAYfPqHGjsU2gHTegDaAhHQJ1mdh6Skj51fZQoaAZHQHFg0UTL4etoB0vnaAhHQJ3MpS1maph1fZQoaAZHQHImnxjJ+2FoB0vRaAhHQJ3NjNY8uBd1fZQoaAZHQG/GBomG/N9oB02kAWgIR0CdzbIAwPAgdX2UKGgGR0ByNI61b7j1aAdNBwFoCEdAnc7mjwhGIHV9lChoBkdAbEN9ph4MW2gHTbEDaAhHQJ3QJ5le4Td1fZQoaAZHQHBZwnQY1pFoB01cAWgIR0Cd0E7N0NjLdX2UKGgGR0BBVXs5XEIgaAdLyWgIR0Cd0J29L6DXdX2UKGgGR0BsABC2MKkVaAdNJgFoCEdAndDrUb1h9nV9lChoBkdAYs7V6NVBEGgHTegDaAhHQJ3UmkSElE91fZQoaAZHQFzqf779AHFoB03oA2gIR0Cd1M2zOX3QdX2UKGgGR0Bxoo7/4qPPaAdNCAFoCEdAndWosunMuHV9lChoBkdAcDPX8O09hmgHTRYBaAhHQJ3WirfcesB1fZQoaAZHQDdkxubZvk1oB0u9aAhHQJ3XZl5GBnV1fZQoaAZHQG4jhhx5s0poB0v7aAhHQJ3XeDdxhlV1fZQoaAZHQHG1AIyCWeJoB00dAWgIR0Cd2KrwvxpddX2UKGgGR0Bw2JUT+NtJaAdNQAFoCEdAndknf2saKnV9lChoBkdAcof9YOlO5GgHS+loCEdAndlP+GXXy3V9lChoBkdAbLAT6i0v5GgHS+JoCEdAnd1U6cRUWHV9lChoBkdAcMB37UG3WmgHS/xoCEdAnd6jlkpZwHV9lChoBkdAb3sGFi8WbmgHS+9oCEdAnd8aBqbjLnV9lChoBkdAcc24qwyIpGgHS/poCEdAneCyMo+fRXV9lChoBkdAb/KkP+XJHWgHTQ0BaAhHQJ3jkFB6a9d1fZQoaAZHQG1gVMuez2RoB00SAWgIR0Cd48INVinYdX2UKGgGR0BvZwbdadMCaAdL62gIR0Cd5FXK8tf5dX2UKGgGR0Blz+cc2itaaAdN6AFoCEdAneZxwl0HQnV9lChoBkdAbU+ADJU5uWgHTSUBaAhHQJ3nj+6y0KJ1fZQoaAZHQHLGtZNfw7VoB01bAWgIR0Cd6h1yvLX+dX2UKGgGR0BxLWTGHYYjaAdL/GgIR0Cd7a/CqIacdX2UKGgGR0Bxsi2H+IdmaAdNOgFoCEdAne8wvlEJB3V9lChoBkdAWzYDhcZ9/mgHTegDaAhHQJ3xH58BuGd1fZQoaAZHQG+vnOryUcJoB0v1aAhHQJ3xtrgwXZZ1fZQoaAZHQG1du4gA6uJoB0v6aAhHQJ3yg9mpVCJ1fZQoaAZHQG2cMQNCqp9oB03DA2gIR0Cd9HTTfBN3dX2UKGgGR0BvhLEcbR4RaAdNhAFoCEdAnfan/tICl3V9lChoBkdAcZM+uNgjQmgHTQYBaAhHQJ338EzO5ax1fZQoaAZHQHBlSmdiDuloB01CAWgIR0Cd+NF4LThHdX2UKGgGR0Bex52pyZKGaAdN6ANoCEdAnfqDL0SRKnV9lChoBkdAXDhHz6JqI2gHTegDaAhHQJ36wLUkOZt1fZQoaAZHQHCPHeaa1CxoB00IAWgIR0Cd+/ECeVcEdX2UKGgGR0Bvxiwt8NQTaAdL3mgIR0Cd/E/1xsEadX2UKGgGR0Bdm9a2WpqAaAdN6ANoCEdAnf4ztXxOL3V9lChoBkdAcSwYukDZDmgHTSUBaAhHQJ3+4B/7SAp1fZQoaAZHQHG1R+nZTQ5oB00XAWgIR0Cd/3mozeoDdX2UKGgGR0Befh4t6HCXaAdN6ANoCEdAnf/phWo3rHV9lChoBkdAcGeabF0gbWgHS/xoCEdAngAIUSIxg3V9lChoBkdAbnNqWTot+WgHS/5oCEdAngGwmReTmnV9lChoBkdAcJzV/MGHHmgHS+poCEdAngKYvvjOs3V9lChoBkdAbjoyLQ5WBGgHS+FoCEdAngPkoKD02HV9lChoBkdAcYItz0Yj0WgHS/toCEdAngZPv0AcUHV9lChoBkdAJtNiYsunM2gHS8doCEdAngcOsHSncnV9lChoBkdAcqt1Q66remgHTRoBaAhHQJ4ILMJQcgh1fZQoaAZHQGryl98Z1mtoB00SAWgIR0CeDBHG0eEJdX2UKGgGR0BgudvES/TLaAdN6ANoCEdAnhDeSB9TgnV9lChoBkdAYRFS9du50GgHTegDaAhHQJ4VHnxJ/Xp1fZQoaAZHQGOkDcVQAMloB03oA2gIR0CeGBh4+r2hdX2UKGgGR0Bt/RDZ13dLaAdNBwJoCEdAnhmn8jzI3nV9lChoBkdAckHkE9t/F2gHTQoBaAhHQJ4bFrXUYsN1fZQoaAZHQGGKrnDBMzxoB03oA2gIR0CeH6DIikftdX2UKGgGR0BxFTNX5nDjaAdL9mgIR0CeIA0Rvm5ldX2UKGgGR0BwqFfYzzmPaAdL+mgIR0CeJnPN3W4FdX2UKGgGR0Bt+BAWznieaAdL9GgIR0CeJ0zLwF1TdX2UKGgGR0Bdh5nctXgcaAdN6ANoCEdAnioMcABDHHV9lChoBkdAcETC4jKPn2gHS/hoCEdAnix0k0JnhHV9lChoBkdAXy9uIhyKemgHTegDaAhHQJ4s3OX3QD51fZQoaAZHQHG5OwTufEpoB01VAWgIR0CeLXftQbdadWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 220, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV/QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgLjAJpOJSJiIeUUpQoSwNoD05OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.0+cu121", "GPU Enabled": "True", "Numpy": "1.26.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7a8e71966d40>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a8e71966dd0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a8e71966e60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a8e71966ef0>", "_build": "<function ActorCriticPolicy._build at 0x7a8e71966f80>", "forward": "<function ActorCriticPolicy.forward at 0x7a8e71967010>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a8e719670a0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a8e71967130>", "_predict": "<function ActorCriticPolicy._predict at 0x7a8e719671c0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a8e71967250>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a8e719672e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a8e71967370>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7a8e72290180>"}, "verbose": 0, "policy_kwargs": {}, "num_timesteps": 229376, "_total_timesteps": 200000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1724932876287872543, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": null, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.1468799999999999, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV7gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHIrTUNKAayMAWyUS/SMAXSUR0CoGd0daMaTdX2UKGgGR0BvwnzOHFglaAdL2mgIR0CoGogTyrggdX2UKGgGR0BxI91loUSJaAdLzWgIR0CoGzTHjp9rdX2UKGgGR0ByHvHAAQxvaAdL0WgIR0CoG32CuloEdX2UKGgGR0Bxj+SIP9UCaAdLwmgIR0CoG6dnCfpVdX2UKGgGR0BuZOrGR3eOaAdLzWgIR0CoHFapxWDIdX2UKGgGR0BwZfpPhybQaAdLx2gIR0CoHI7/XGwSdX2UKGgGR0BxSuVTrE9/aAdLy2gIR0CoHLjrAxi5dX2UKGgGR0ByCiwpvxYraAdNBAFoCEdAqBzZ7NSqEXV9lChoBkdAcWYOavzOHGgHS89oCEdAqB2Kxu89OnV9lChoBkdAW53HT7VJ+WgHTegDaAhHQKgeH4pMHr11fZQoaAZHQHCYyZa3ZwpoB0vJaAhHQKgeR/95yEN1fZQoaAZHQHCNI4Qz1sdoB0vpaAhHQKgefMGHHm11fZQoaAZHQG5pLu6VdHFoB0vQaAhHQKgfSEr5IpZ1fZQoaAZHQHH0IL9deIFoB0vxaAhHQKgfWiMYMv11fZQoaAZHQHGI9n003wVoB0vdaAhHQKgfs69TP0J1fZQoaAZHQHGJIlD4QBhoB0vdaAhHQKgf0iJO32F1fZQoaAZHQHHIiRwIdENoB0vNaAhHQKggRNB4Uvh1fZQoaAZHQHI8cbR4QjFoB0vRaAhHQKggc/dIoVp1fZQoaAZHQHJdGuoxYaJoB0vqaAhHQKggiQfZElV1fZQoaAZHQHGvF0PpY9xoB0vEaAhHQKgharTYukF1fZQoaAZHQG+8Lqt5le5oB0v1aAhHQKghsgXdj5N1fZQoaAZHQHHe0KeCkGloB0vFaAhHQKgh1QdCE6F1fZQoaAZHQHCzmIoE0SBoB0vmaAhHQKgiNVJ+UhV1fZQoaAZHQHAahi5NGmVoB0vRaAhHQKgi9syBTXJ1fZQoaAZHQHDsEYfnwG5oB0vZaAhHQKgjMXvYvnN1fZQoaAZHQG8PHDJlrdpoB0vJaAhHQKgjSl54W1t1fZQoaAZHQG9G7qIJqqRoB0vEaAhHQKgjVAE+xGF1fZQoaAZHQGJp8ebNKRNoB03oA2gIR0CoI4z4L1EmdX2UKGgGR0Bx4Hin5zo2aAdLvWgIR0CoI8mukk8idX2UKGgGR0BmoAhhYvFnaAdN6ANoCEdAqCP8LpiZv3V9lChoBkdAcWxnLq2SdWgHS9VoCEdAqCQu1v2oN3V9lChoBkdAchgob4rSVmgHS9loCEdAqCTvKdQO4HV9lChoBkdAcsMS1Vo6CGgHS+loCEdAqCVjmQr+YXV9lChoBkdAcnw4oqkM1GgHS91oCEdAqCWjsQd0aXV9lChoBkdAcqI1WbPQfWgHTRIBaAhHQKgmIXm/3391fZQoaAZHQHHqpOrQw9JoB0vSaAhHQKgmbLM9r451fZQoaAZHQHDCWnjyWiVoB0vaaAhHQKgmcFoL5RF1fZQoaAZHQG9H8M3IdU9oB0vXaAhHQKgmeSqU/wB1fZQoaAZHQHIKZGax5cFoB0vYaAhHQKgmuI7eVLV1fZQoaAZHQHJs761stTVoB0v8aAhHQKgmw1mapgl1fZQoaAZHQG5aLfLs8gZoB0vSaAhHQKgm3Vqesgd1fZQoaAZHQG74BV2icoZoB0vNaAhHQKgm+pMHryF1fZQoaAZHQGRs0EPlMh5oB03oA2gIR0CoJ1z2WY4RdX2UKGgGR0By49OTJQtSaAdL72gIR0CoJ6YS6DoRdX2UKGgGR0Bx97mKZUkwaAdL3GgIR0CoKCHDziCKdX2UKGgGR0BwuIN6PbPAaAdL02gIR0CoKLIZZSvUdX2UKGgGR0Bwlo5vLowFaAdL7WgIR0CoKNmCZnctdX2UKGgGR0Bw/HAxi5NHaAdLuGgIR0CoKQu+7Dl6dX2UKGgGR0Bw5KQvHtF8aAdL02gIR0CoKXTLwF1TdX2UKGgGR0Byvy4vvjOtaAdL7GgIR0CoKZQLmZE2dX2UKGgGR0Bxmrmhdt2taAdL22gIR0CoKZ+IEbHZdX2UKGgGR0BwyoHB1s+FaAdLuWgIR0CoKaXEQ5FPdX2UKGgGR0BxuXsPatcOaAdL4GgIR0CoKfptBOYZdX2UKGgGR0BvpVgrpaA4aAdL42gIR0CoKiG1IAfddX2UKGgGR0Bv2xFXq7iAaAdLwGgIR0CoKibF85S4dX2UKGgGR0Bfkx0IToMbaAdN6ANoCEdAqCqlaW5Yo3V9lChoBkdAcdBnL7oB72gHS89oCEdAqCszAaef7XV9lChoBkdAQlSPGQ0XQGgHS5NoCEdAqCs37vXsgXV9lChoBkdAcU0OSW7e22gHS/toCEdAqCtQvDgqE3V9lChoBkdAccJuU2UB4mgHS8RoCEdAqCuXKU3XI3V9lChoBkdAcqdtix3V1GgHTVsBaAhHQKgrtXHR1HR1fZQoaAZHQHCUB+fAbhpoB0u1aAhHQKgsD0QK8cx1fZQoaAZHQHCf7AUL2HtoB0vdaAhHQKgsD8DSw4d1fZQoaAZHQGaR5wwTM7loB03oA2gIR0CoLE3hwVCYdX2UKGgGR0Bx9C4MF2V3aAdLwmgIR0CoLGEzwc5sdX2UKGgGR0Bx9yfe1rqMaAdL0GgIR0CoLIOU+s5odX2UKGgGR0Bua3zg/C66aAdL0GgIR0CoLPscIZ62dX2UKGgGR0ByMIDNhVlxaAdNHgFoCEdAqC2adQO4G3V9lChoBkdAcpHr+o99t2gHS7xoCEdAqC3AMa0hNnV9lChoBkdAcKgv114gR2gHS+toCEdAqC3ZekYXPHV9lChoBkdAc05LbHp8nmgHS8ZoCEdAqC38X1rZanV9lChoBkdAcfnwaR6ni2gHS7hoCEdAqC4QL3K0U3V9lChoBkdAb62g6EJ0GWgHS8BoCEdAqC6pS9/SY3V9lChoBkdAcKrornTy8WgHS8NoCEdAqC65sMy8BnV9lChoBkdAcBpwqy4WlGgHS8poCEdAqC8rfrKNhnV9lChoBkdAb9u2H+Idl2gHS8BoCEdAqC9DUZvUBnV9lChoBkdAcEClsP8Q7WgHS81oCEdAqC9KwdKdx3V9lChoBkdAZEiv9tMwlGgHTegDaAhHQKgvS//vOQh1fZQoaAZHQHOvAfyPMjhoB006AWgIR0CoL5kSVW0adX2UKGgGR0BxlCgVXV9XaAdNKwFoCEdAqC/hhQWN3nV9lChoBkdAcajEpAlfJGgHS9toCEdAqDAiF7D2rXV9lChoBkdAbUZd1uBMBmgHS8NoCEdAqDCQmZ3LWHV9lChoBkdAbteLmZE2HmgHS8FoCEdAqDCjzND+i3V9lChoBkdAcw8AZsKsuGgHS7RoCEdAqDCrbQC0W3V9lChoBkdAchjm6GxlhGgHS91oCEdAqDDN6C17Y3V9lChoBkdAc2+LzwtrbmgHS71oCEdAqDGIIv8IiXV9lChoBkdAcOjpaA4GU2gHS8xoCEdAqDHzayrxRXV9lChoBkdAb7SR8twrD2gHTQoBaAhHQKgyMK0lZ5l1fZQoaAZHQHFF0tRNyo5oB0u8aAhHQKgyRglWwNd1fZQoaAZHQG81WrwOOKhoB0u7aAhHQKgyTV+7UXp1fZQoaAZHQHOsSMglnh9oB0vSaAhHQKgyvXDm8ul1fZQoaAZHQHDK4keIVM5oB0uxaAhHQKgzX91EE1V1fZQoaAZHQHGC4nBtUGVoB0v7aAhHQKgzbvvSc9Z1fZQoaAZHQHAtRnvlU6xoB0vcaAhHQKgzdAgPmPp1fZQoaAZHQHMW+dCmdiFoB0vQaAhHQKgznq9Gqgh1fZQoaAZHQHGTDRD1GspoB0vUaAhHQKg1Hw6QvHt1fZQoaAZHQHMM0XYUWVNoB0vpaAhHQKg1azgMtsh1fZQoaAZHQHHw85S3soloB0v5aAhHQKg1piZv1lJ1fZQoaAZHQHDj7eVLSNRoB0vDaAhHQKg1v/4Irvt1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 360, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV/QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgLjAJpOJSJiIeUUpQoSwNoD05OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.0+cu121", "GPU Enabled": "True", "Numpy": "1.26.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34ca044ea8182b8431b52d6b92323ead09ae9d0504dba9cda89855340493dafe
3
- size 147272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:005799c263107553b353926f4d34218957d640528136c2ca66647dc90ce87d17
3
+ size 147208
ppo-LunarLander-v2/data CHANGED
@@ -21,12 +21,12 @@
21
  },
22
  "verbose": 0,
23
  "policy_kwargs": {},
24
- "num_timesteps": 131072,
25
- "_total_timesteps": 100000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1724931803726300587,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": null,
@@ -38,17 +38,17 @@
38
  "_episode_num": 0,
39
  "use_sde": false,
40
  "sde_sample_freq": -1,
41
- "_current_progress_remaining": -0.3107200000000001,
42
  "_stats_window_size": 100,
43
  "ep_info_buffer": {
44
  ":type:": "<class 'collections.deque'>",
45
- ":serialized:": "gAWVHwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCihxgiNbWMAWyUTRUBjAF0lEdAnT30BXCCSXV9lChoBkdAcYvZKFqSHWgHTREBaAhHQJ0/JT6zmfZ1fZQoaAZHQHCJrX+VC5VoB00NAWgIR0CdPyVzp5eJdX2UKGgGR0BuimbqhUR4aAdL+GgIR0CdQbgGbCrMdX2UKGgGR0BguNiONo8IaAdN6ANoCEdAnUHwzUI9knV9lChoBkdAb/oukk8ifWgHS+hoCEdAnULHa8Hv+nV9lChoBkdAcNzHiFTNuGgHTacBaAhHQJ1Dpk+X7ch1fZQoaAZHQDjZ3GGVRk5oB0vpaAhHQJ1FpJf6XSl1fZQoaAZHQGJ2mZmZmZpoB03oA2gIR0CdRssqril0dX2UKGgGR0BicicEvCdjaAdN6ANoCEdAnUmPUWl/IHV9lChoBkdAR8rHn2ZiNWgHS9hoCEdAnUmv3FkxynV9lChoBkdAcjhm3OObRWgHS/NoCEdAnUmxFuvU0HV9lChoBkdAbzFQTmGM42gHTQkCaAhHQJ1PWdRR/Ex1fZQoaAZHQGzTGnn+yZ9oB02rAWgIR0CdUBHmig01dX2UKGgGR0BxGb7+DOC5aAdNFAFoCEdAnVJAPiDM/3V9lChoBkdAcgPenAIppmgHTQwBaAhHQJ1SxuGbkOt1fZQoaAZHQHHLJwn6VMVoB00SAWgIR0CdVSLdN34cdX2UKGgGR8BJoXZXdTHbaAdL12gIR0CdVWAgPmPpdX2UKGgGR0BuDJ2r4nF6aAdL+WgIR0CdVvdTo+wDdX2UKGgGR0BxVzmeUY8/aAdNBwFoCEdAnVeSGnGbTnV9lChoBkdAZgd+jM3ZPGgHTegDaAhHQJ1Xp+w1R+B1fZQoaAZHQG+pIhQm/nJoB0v6aAhHQJ1a8SL61st1fZQoaAZHQHFB6QRwqAloB0vlaAhHQJ1c2WLP2PF1fZQoaAZHQF+KG8274BVoB03oA2gIR0CdXYMfA9FGdX2UKGgGR0BwSTgLqlguaAdNCwFoCEdAnV4F0YCQtHV9lChoBkdAb8Xzp5eJHmgHTdMBaAhHQJ1eeP5pJwt1fZQoaAZHQHGbQp8WsRxoB0vkaAhHQJ1fBouf29N1fZQoaAZHQHDjYKhL5ARoB01gAWgIR0CdX8fiPyTZdX2UKGgGR0BvLDU3GXHBaAdL82gIR0CdX9GgzxgBdX2UKGgGR0BwZrd2xIJ7aAdNCgFoCEdAnWKtLlFMI3V9lChoBkdAcMy6eGwiaGgHTRMBaAhHQJ1jGdUbT+h1fZQoaAZHQGAbQUHpr1xoB03oA2gIR0CdZgLPldTpdX2UKGgGR0BFTYkVvddnaAdL1mgIR0CdZjmdiDujdX2UKGgGR0ByMwOLBKtgaAdNEwFoCEdAnWZ1oUSIxnV9lChoBkdAYfPqHGjsU2gHTegDaAhHQJ1mdh6Skj51fZQoaAZHQHFg0UTL4etoB0vnaAhHQJ3MpS1maph1fZQoaAZHQHImnxjJ+2FoB0vRaAhHQJ3NjNY8uBd1fZQoaAZHQG/GBomG/N9oB02kAWgIR0CdzbIAwPAgdX2UKGgGR0ByNI61b7j1aAdNBwFoCEdAnc7mjwhGIHV9lChoBkdAbEN9ph4MW2gHTbEDaAhHQJ3QJ5le4Td1fZQoaAZHQHBZwnQY1pFoB01cAWgIR0Cd0E7N0NjLdX2UKGgGR0BBVXs5XEIgaAdLyWgIR0Cd0J29L6DXdX2UKGgGR0BsABC2MKkVaAdNJgFoCEdAndDrUb1h9nV9lChoBkdAYs7V6NVBEGgHTegDaAhHQJ3UmkSElE91fZQoaAZHQFzqf779AHFoB03oA2gIR0Cd1M2zOX3QdX2UKGgGR0Bxoo7/4qPPaAdNCAFoCEdAndWosunMuHV9lChoBkdAcDPX8O09hmgHTRYBaAhHQJ3WirfcesB1fZQoaAZHQDdkxubZvk1oB0u9aAhHQJ3XZl5GBnV1fZQoaAZHQG4jhhx5s0poB0v7aAhHQJ3XeDdxhlV1fZQoaAZHQHG1AIyCWeJoB00dAWgIR0Cd2KrwvxpddX2UKGgGR0Bw2JUT+NtJaAdNQAFoCEdAndknf2saKnV9lChoBkdAcof9YOlO5GgHS+loCEdAndlP+GXXy3V9lChoBkdAbLAT6i0v5GgHS+JoCEdAnd1U6cRUWHV9lChoBkdAcMB37UG3WmgHS/xoCEdAnd6jlkpZwHV9lChoBkdAb3sGFi8WbmgHS+9oCEdAnd8aBqbjLnV9lChoBkdAcc24qwyIpGgHS/poCEdAneCyMo+fRXV9lChoBkdAb/KkP+XJHWgHTQ0BaAhHQJ3jkFB6a9d1fZQoaAZHQG1gVMuez2RoB00SAWgIR0Cd48INVinYdX2UKGgGR0BvZwbdadMCaAdL62gIR0Cd5FXK8tf5dX2UKGgGR0Blz+cc2itaaAdN6AFoCEdAneZxwl0HQnV9lChoBkdAbU+ADJU5uWgHTSUBaAhHQJ3nj+6y0KJ1fZQoaAZHQHLGtZNfw7VoB01bAWgIR0Cd6h1yvLX+dX2UKGgGR0BxLWTGHYYjaAdL/GgIR0Cd7a/CqIacdX2UKGgGR0Bxsi2H+IdmaAdNOgFoCEdAne8wvlEJB3V9lChoBkdAWzYDhcZ9/mgHTegDaAhHQJ3xH58BuGd1fZQoaAZHQG+vnOryUcJoB0v1aAhHQJ3xtrgwXZZ1fZQoaAZHQG1du4gA6uJoB0v6aAhHQJ3yg9mpVCJ1fZQoaAZHQG2cMQNCqp9oB03DA2gIR0Cd9HTTfBN3dX2UKGgGR0BvhLEcbR4RaAdNhAFoCEdAnfan/tICl3V9lChoBkdAcZM+uNgjQmgHTQYBaAhHQJ338EzO5ax1fZQoaAZHQHBlSmdiDuloB01CAWgIR0Cd+NF4LThHdX2UKGgGR0Bex52pyZKGaAdN6ANoCEdAnfqDL0SRKnV9lChoBkdAXDhHz6JqI2gHTegDaAhHQJ36wLUkOZt1fZQoaAZHQHCPHeaa1CxoB00IAWgIR0Cd+/ECeVcEdX2UKGgGR0Bvxiwt8NQTaAdL3mgIR0Cd/E/1xsEadX2UKGgGR0Bdm9a2WpqAaAdN6ANoCEdAnf4ztXxOL3V9lChoBkdAcSwYukDZDmgHTSUBaAhHQJ3+4B/7SAp1fZQoaAZHQHG1R+nZTQ5oB00XAWgIR0Cd/3mozeoDdX2UKGgGR0Befh4t6HCXaAdN6ANoCEdAnf/phWo3rHV9lChoBkdAcGeabF0gbWgHS/xoCEdAngAIUSIxg3V9lChoBkdAbnNqWTot+WgHS/5oCEdAngGwmReTmnV9lChoBkdAcJzV/MGHHmgHS+poCEdAngKYvvjOs3V9lChoBkdAbjoyLQ5WBGgHS+FoCEdAngPkoKD02HV9lChoBkdAcYItz0Yj0WgHS/toCEdAngZPv0AcUHV9lChoBkdAJtNiYsunM2gHS8doCEdAngcOsHSncnV9lChoBkdAcqt1Q66remgHTRoBaAhHQJ4ILMJQcgh1fZQoaAZHQGryl98Z1mtoB00SAWgIR0CeDBHG0eEJdX2UKGgGR0BgudvES/TLaAdN6ANoCEdAnhDeSB9TgnV9lChoBkdAYRFS9du50GgHTegDaAhHQJ4VHnxJ/Xp1fZQoaAZHQGOkDcVQAMloB03oA2gIR0CeGBh4+r2hdX2UKGgGR0Bt/RDZ13dLaAdNBwJoCEdAnhmn8jzI3nV9lChoBkdAckHkE9t/F2gHTQoBaAhHQJ4bFrXUYsN1fZQoaAZHQGGKrnDBMzxoB03oA2gIR0CeH6DIikftdX2UKGgGR0BxFTNX5nDjaAdL9mgIR0CeIA0Rvm5ldX2UKGgGR0BwqFfYzzmPaAdL+mgIR0CeJnPN3W4FdX2UKGgGR0Bt+BAWznieaAdL9GgIR0CeJ0zLwF1TdX2UKGgGR0Bdh5nctXgcaAdN6ANoCEdAnioMcABDHHV9lChoBkdAcETC4jKPn2gHS/hoCEdAnix0k0JnhHV9lChoBkdAXy9uIhyKemgHTegDaAhHQJ4s3OX3QD51fZQoaAZHQHG5OwTufEpoB01VAWgIR0CeLXftQbdadWUu"
46
  },
47
  "ep_success_buffer": {
48
  ":type:": "<class 'collections.deque'>",
49
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
50
  },
51
- "_n_updates": 220,
52
  "observation_space": {
53
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
54
  ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
 
21
  },
22
  "verbose": 0,
23
  "policy_kwargs": {},
24
+ "num_timesteps": 229376,
25
+ "_total_timesteps": 200000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1724932876287872543,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": null,
 
38
  "_episode_num": 0,
39
  "use_sde": false,
40
  "sde_sample_freq": -1,
41
+ "_current_progress_remaining": -0.1468799999999999,
42
  "_stats_window_size": 100,
43
  "ep_info_buffer": {
44
  ":type:": "<class 'collections.deque'>",
45
+ ":serialized:": "gAWV7gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHIrTUNKAayMAWyUS/SMAXSUR0CoGd0daMaTdX2UKGgGR0BvwnzOHFglaAdL2mgIR0CoGogTyrggdX2UKGgGR0BxI91loUSJaAdLzWgIR0CoGzTHjp9rdX2UKGgGR0ByHvHAAQxvaAdL0WgIR0CoG32CuloEdX2UKGgGR0Bxj+SIP9UCaAdLwmgIR0CoG6dnCfpVdX2UKGgGR0BuZOrGR3eOaAdLzWgIR0CoHFapxWDIdX2UKGgGR0BwZfpPhybQaAdLx2gIR0CoHI7/XGwSdX2UKGgGR0BxSuVTrE9/aAdLy2gIR0CoHLjrAxi5dX2UKGgGR0ByCiwpvxYraAdNBAFoCEdAqBzZ7NSqEXV9lChoBkdAcWYOavzOHGgHS89oCEdAqB2Kxu89OnV9lChoBkdAW53HT7VJ+WgHTegDaAhHQKgeH4pMHr11fZQoaAZHQHCYyZa3ZwpoB0vJaAhHQKgeR/95yEN1fZQoaAZHQHCNI4Qz1sdoB0vpaAhHQKgefMGHHm11fZQoaAZHQG5pLu6VdHFoB0vQaAhHQKgfSEr5IpZ1fZQoaAZHQHH0IL9deIFoB0vxaAhHQKgfWiMYMv11fZQoaAZHQHGI9n003wVoB0vdaAhHQKgfs69TP0J1fZQoaAZHQHGJIlD4QBhoB0vdaAhHQKgf0iJO32F1fZQoaAZHQHHIiRwIdENoB0vNaAhHQKggRNB4Uvh1fZQoaAZHQHI8cbR4QjFoB0vRaAhHQKggc/dIoVp1fZQoaAZHQHJdGuoxYaJoB0vqaAhHQKggiQfZElV1fZQoaAZHQHGvF0PpY9xoB0vEaAhHQKgharTYukF1fZQoaAZHQG+8Lqt5le5oB0v1aAhHQKghsgXdj5N1fZQoaAZHQHHe0KeCkGloB0vFaAhHQKgh1QdCE6F1fZQoaAZHQHCzmIoE0SBoB0vmaAhHQKgiNVJ+UhV1fZQoaAZHQHAahi5NGmVoB0vRaAhHQKgi9syBTXJ1fZQoaAZHQHDsEYfnwG5oB0vZaAhHQKgjMXvYvnN1fZQoaAZHQG8PHDJlrdpoB0vJaAhHQKgjSl54W1t1fZQoaAZHQG9G7qIJqqRoB0vEaAhHQKgjVAE+xGF1fZQoaAZHQGJp8ebNKRNoB03oA2gIR0CoI4z4L1EmdX2UKGgGR0Bx4Hin5zo2aAdLvWgIR0CoI8mukk8idX2UKGgGR0BmoAhhYvFnaAdN6ANoCEdAqCP8LpiZv3V9lChoBkdAcWxnLq2SdWgHS9VoCEdAqCQu1v2oN3V9lChoBkdAchgob4rSVmgHS9loCEdAqCTvKdQO4HV9lChoBkdAcsMS1Vo6CGgHS+loCEdAqCVjmQr+YXV9lChoBkdAcnw4oqkM1GgHS91oCEdAqCWjsQd0aXV9lChoBkdAcqI1WbPQfWgHTRIBaAhHQKgmIXm/3391fZQoaAZHQHHqpOrQw9JoB0vSaAhHQKgmbLM9r451fZQoaAZHQHDCWnjyWiVoB0vaaAhHQKgmcFoL5RF1fZQoaAZHQG9H8M3IdU9oB0vXaAhHQKgmeSqU/wB1fZQoaAZHQHIKZGax5cFoB0vYaAhHQKgmuI7eVLV1fZQoaAZHQHJs761stTVoB0v8aAhHQKgmw1mapgl1fZQoaAZHQG5aLfLs8gZoB0vSaAhHQKgm3Vqesgd1fZQoaAZHQG74BV2icoZoB0vNaAhHQKgm+pMHryF1fZQoaAZHQGRs0EPlMh5oB03oA2gIR0CoJ1z2WY4RdX2UKGgGR0By49OTJQtSaAdL72gIR0CoJ6YS6DoRdX2UKGgGR0Bx97mKZUkwaAdL3GgIR0CoKCHDziCKdX2UKGgGR0BwuIN6PbPAaAdL02gIR0CoKLIZZSvUdX2UKGgGR0Bwlo5vLowFaAdL7WgIR0CoKNmCZnctdX2UKGgGR0Bw/HAxi5NHaAdLuGgIR0CoKQu+7Dl6dX2UKGgGR0Bw5KQvHtF8aAdL02gIR0CoKXTLwF1TdX2UKGgGR0Byvy4vvjOtaAdL7GgIR0CoKZQLmZE2dX2UKGgGR0Bxmrmhdt2taAdL22gIR0CoKZ+IEbHZdX2UKGgGR0BwyoHB1s+FaAdLuWgIR0CoKaXEQ5FPdX2UKGgGR0BxuXsPatcOaAdL4GgIR0CoKfptBOYZdX2UKGgGR0BvpVgrpaA4aAdL42gIR0CoKiG1IAfddX2UKGgGR0Bv2xFXq7iAaAdLwGgIR0CoKibF85S4dX2UKGgGR0Bfkx0IToMbaAdN6ANoCEdAqCqlaW5Yo3V9lChoBkdAcdBnL7oB72gHS89oCEdAqCszAaef7XV9lChoBkdAQlSPGQ0XQGgHS5NoCEdAqCs37vXsgXV9lChoBkdAcU0OSW7e22gHS/toCEdAqCtQvDgqE3V9lChoBkdAccJuU2UB4mgHS8RoCEdAqCuXKU3XI3V9lChoBkdAcqdtix3V1GgHTVsBaAhHQKgrtXHR1HR1fZQoaAZHQHCUB+fAbhpoB0u1aAhHQKgsD0QK8cx1fZQoaAZHQHCf7AUL2HtoB0vdaAhHQKgsD8DSw4d1fZQoaAZHQGaR5wwTM7loB03oA2gIR0CoLE3hwVCYdX2UKGgGR0Bx9C4MF2V3aAdLwmgIR0CoLGEzwc5sdX2UKGgGR0Bx9yfe1rqMaAdL0GgIR0CoLIOU+s5odX2UKGgGR0Bua3zg/C66aAdL0GgIR0CoLPscIZ62dX2UKGgGR0ByMIDNhVlxaAdNHgFoCEdAqC2adQO4G3V9lChoBkdAcpHr+o99t2gHS7xoCEdAqC3AMa0hNnV9lChoBkdAcKgv114gR2gHS+toCEdAqC3ZekYXPHV9lChoBkdAc05LbHp8nmgHS8ZoCEdAqC38X1rZanV9lChoBkdAcfnwaR6ni2gHS7hoCEdAqC4QL3K0U3V9lChoBkdAb62g6EJ0GWgHS8BoCEdAqC6pS9/SY3V9lChoBkdAcKrornTy8WgHS8NoCEdAqC65sMy8BnV9lChoBkdAcBpwqy4WlGgHS8poCEdAqC8rfrKNhnV9lChoBkdAb9u2H+Idl2gHS8BoCEdAqC9DUZvUBnV9lChoBkdAcEClsP8Q7WgHS81oCEdAqC9KwdKdx3V9lChoBkdAZEiv9tMwlGgHTegDaAhHQKgvS//vOQh1fZQoaAZHQHOvAfyPMjhoB006AWgIR0CoL5kSVW0adX2UKGgGR0BxlCgVXV9XaAdNKwFoCEdAqC/hhQWN3nV9lChoBkdAcajEpAlfJGgHS9toCEdAqDAiF7D2rXV9lChoBkdAbUZd1uBMBmgHS8NoCEdAqDCQmZ3LWHV9lChoBkdAbteLmZE2HmgHS8FoCEdAqDCjzND+i3V9lChoBkdAcw8AZsKsuGgHS7RoCEdAqDCrbQC0W3V9lChoBkdAchjm6GxlhGgHS91oCEdAqDDN6C17Y3V9lChoBkdAc2+LzwtrbmgHS71oCEdAqDGIIv8IiXV9lChoBkdAcOjpaA4GU2gHS8xoCEdAqDHzayrxRXV9lChoBkdAb7SR8twrD2gHTQoBaAhHQKgyMK0lZ5l1fZQoaAZHQHFF0tRNyo5oB0u8aAhHQKgyRglWwNd1fZQoaAZHQG81WrwOOKhoB0u7aAhHQKgyTV+7UXp1fZQoaAZHQHOsSMglnh9oB0vSaAhHQKgyvXDm8ul1fZQoaAZHQHDK4keIVM5oB0uxaAhHQKgzX91EE1V1fZQoaAZHQHGC4nBtUGVoB0v7aAhHQKgzbvvSc9Z1fZQoaAZHQHAtRnvlU6xoB0vcaAhHQKgzdAgPmPp1fZQoaAZHQHMW+dCmdiFoB0vQaAhHQKgznq9Gqgh1fZQoaAZHQHGTDRD1GspoB0vUaAhHQKg1Hw6QvHt1fZQoaAZHQHMM0XYUWVNoB0vpaAhHQKg1azgMtsh1fZQoaAZHQHHw85S3soloB0v5aAhHQKg1piZv1lJ1fZQoaAZHQHDj7eVLSNRoB0vDaAhHQKg1v/4Irvt1ZS4="
46
  },
47
  "ep_success_buffer": {
48
  ":type:": "<class 'collections.deque'>",
49
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
50
  },
51
+ "_n_updates": 360,
52
  "observation_space": {
53
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
54
  ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ae42d90d7295442a2565448bb55f7b41d8ba1247e07e9762aa52f967cc7d04d
3
  size 88490
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed0fb3222b8e3d1085c79ed75c29a0605f9af9638d5098dbe1edcec10493e9f
3
  size 88490
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f0c83f956fe9fb51b3914c31b04ab9028aa064c3305dd7902e8b59ec9410738
3
  size 43762
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53aacd296c84a303605320905ed79dbab1c52103d211d37b80bc2284bd0220d1
3
  size 43762
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 231.50544469000005, "std_reward": 51.07858734698292, "is_deterministic": true, "n_eval_episodes": 100, "eval_datetime": "2024-08-29T11:50:50.570178"}
 
1
+ {"mean_reward": 268.47804281, "std_reward": 21.86590381423725, "is_deterministic": true, "n_eval_episodes": 100, "eval_datetime": "2024-08-29T12:10:09.277251"}