saicpp commited on
Commit
be73124
·
verified ·
1 Parent(s): af78708

Finished v4 of model of unit 1

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 224.56 +/- 70.42
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 223.82 +/- 62.29
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7a8e71966d40>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a8e71966dd0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a8e71966e60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a8e71966ef0>", "_build": "<function ActorCriticPolicy._build at 0x7a8e71966f80>", "forward": "<function ActorCriticPolicy.forward at 0x7a8e71967010>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a8e719670a0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a8e71967130>", "_predict": "<function ActorCriticPolicy._predict at 0x7a8e719671c0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a8e71967250>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a8e719672e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a8e71967370>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7a8e72290180>"}, "verbose": 0, "policy_kwargs": {}, "num_timesteps": 131072, "_total_timesteps": 100000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1724931069041287856, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": null, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.3107200000000001, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVPwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGAxRJEpiJCMAWyUTegDjAF0lEdAkR/V0Lc9GXV9lChoBkdAZd8iwjdHlWgHTegDaAhHQJEf11SwW311fZQoaAZHQF12Em6XjVBoB03oA2gIR0CRH9f4REncdX2UKGgGR0BkAROxjawmaAdN6ANoCEdAkR/Ys3AEdXV9lChoBkdAVRt6D5CWvGgHTegDaAhHQJEf2ixmkFh1fZQoaAZHQF6r7Xg9/z9oB03oA2gIR0CRH9vc8DB/dX2UKGgGR0BjSwTIvJzUaAdN6ANoCEdAkR/d0vGp/HV9lChoBkdAY9K0IC2c8WgHTegDaAhHQJEf3obGWD91fZQoaAZHQGWTLh73PAxoB03oA2gIR0CRH9/H5rP/dX2UKGgGR0BgRGSEDhcaaAdN6ANoCEdAkSTrrgOz6nV9lChoBkdAYfMujASFoWgHTegDaAhHQJEmz3BYV7B1fZQoaAZHQGMB/w7T2FpoB03oA2gIR0CRKQa8Yht+dX2UKGgGR0BGgRe1KGtZaAdLxGgIR0CRMdMUh3aBdX2UKGgGR0BhAWkHlfZ3aAdN6ANoCEdAkUSQuM+/xnV9lChoBkdAYRP+2E0zj2gHTegDaAhHQJFLralDWsl1fZQoaAZHQGLSh/RVp9JoB03oA2gIR0CRWehDPWxydX2UKGgGR0Bg1hRMvh60aAdN6ANoCEdAkVvRNRFZxXV9lChoBkdAVef9xZMcqGgHTegDaAhHQJFb0h2W6bx1fZQoaAZHQGYbKQaJhv1oB03oA2gIR0CRW9Nke6qbdX2UKGgGR0BgFC0WuX/paAdN6ANoCEdAkVvUnLJSznV9lChoBkdAYgR1LamGd2gHTegDaAhHQJFb1cTrVvx1fZQoaAZHQGIwhBJI1+BoB03oA2gIR0CRW9cJtzjndX2UKGgGR0Bj4Y4XGff5aAdN6ANoCEdAkVvYs/Y8MnV9lChoBkdAYW2+WWyC4GgHTegDaAhHQJFb2oR7JGR1fZQoaAZHQFvalk6Lfk5oB03oA2gIR0CRW9vv0AcUdX2UKGgGR0BnFnBi1AqvaAdN6ANoCEdAkVveCf6Gg3V9lChoBkdAcJCVo6CDmWgHTeACaAhHQJHFUTewcHZ1fZQoaAZHQF305wOvt+loB03oA2gIR0CRxi2vStvGdX2UKGgGR0BKeGhdt2s8aAdLqmgIR0CRxygOSW7fdX2UKGgGR0Bjn3nEETxoaAdN6ANoCEdAkcnIHPeHi3V9lChoBkdAbaa1a4c3l2gHTaUBaAhHQJHUcVBUrCp1fZQoaAZHQGUgXMINVipoB03oA2gIR0CR5DpbUwztdX2UKGgGR0BeQtld1MdtaAdN6ANoCEdAket9jLB9C3V9lChoBkdAYVfLdN34bmgHTegDaAhHQJH5xfICEHt1fZQoaAZHQGBIdTo+wC9oB03oA2gIR0CR+5gmJFb3dX2UKGgGR0Bhj2Y8dPtVaAdN6ANoCEdAkfuZDZ13dXV9lChoBkdAYmJbxmTTv2gHTegDaAhHQJH7ms3hn8N1fZQoaAZHQGDETySV4X5oB03oA2gIR0CR+5u7YkE+dX2UKGgGR0Bfp3Upd8iOaAdN6ANoCEdAkfudLpRoAXV9lChoBkdAW9bebd8ArGgHTegDaAhHQJH7niiqQzV1fZQoaAZHQGbjCFsYVItoB03oA2gIR0CR+58qWkaddX2UKGgGR0Biz41FYuCgaAdN6ANoCEdAkfugRkEs8XV9lChoBkdAYTpMYdhiLGgHTegDaAhHQJIAAFRpDeF1fZQoaAZHQGMx0ojOcDtoB03oA2gIR0CSAPFAmiQDdX2UKGgGR0BfBxT0g8r7aAdN6ANoCEdAkgIFII4VAXV9lChoBkdAZxwWjXWe6WgHTegDaAhHQJIExas6q811fZQoaAZHQDc0QjD8+A5oB0vHaAhHQJIOYO7QLNR1fZQoaAZHQGHbscIZ62RoB03oA2gIR0CSEu+wTufFdX2UKGgGR0Bs+efmLcbjaAdNrAFoCEdAkhOA57w8XHV9lChoBkdAbQ6X7cfvF2gHTUgBaAhHQJIVGlpGnXN1fZQoaAZHQGw3Ba9sabZoB03UAmgIR0CSFhJCjUNKdX2UKGgGR0BxGtIJ7b+MaAdNAwJoCEdAkhjYo3JgcHV9lChoBkdAXmYc94eLemgHTegDaAhHQJIeo1n/T9d1fZQoaAZHQAsYkeIVM25oB0v5aAhHQJIjb24/eLx1fZQoaAZHQG6km4Ajps5oB00HA2gIR0CSJxsmv4dqdX2UKGgGR0BsXmhZha1UaAdNcgNoCEdAki1ny/bj+HV9lChoBkdAXet6QeV9nmgHTegDaAhHQJIyl4eLehx1fZQoaAZHQFrqro4dZJVoB03oA2gIR0CSNE9Jz1brdX2UKGgGR0BiHie9SMtLaAdN6ANoCEdAkjRQAMlTnHV9lChoBkdAXTe/bj94vGgHTegDaAhHQJI0UD1XeWR1fZQoaAZHQGDlXdj5KvpoB03oA2gIR0CSNFGrCFbndX2UKGgGR0BiaT8aXKKYaAdN6ANoCEdAkjs6WHDaXnV9lChoBkdAY4ajtXxOL2gHTegDaAhHQJKkfBsQ/X51fZQoaAZHQGyZiJfpljFoB03TAmgIR0CSrRfU4JeFdX2UKGgGR0Bj58OG0u14aAdN6ANoCEdAkq7BXKbKBHV9lChoBkdAa4fyQxN7B2gHTbUDaAhHQJKw5TYNAkd1fZQoaAZHQGGOxZ+x4Y9oB03oA2gIR0CSsqC0F8ohdX2UKGgGR0Bh+BV4oqkNaAdN6ANoCEdAkrMGzF+/g3V9lChoBkdAb3TdRiw0O2gHTQwCaAhHQJK2bdUKiPB1fZQoaAZHQGLIPvrnkktoB03oA2gIR0CSt4qxTsIFdX2UKGgGR0Bu3EPe54GEaAdNGwJoCEdAkritnoPkJnV9lChoBkdAcRRcer+5v2gHTawDaAhHQJK+qHk92X91fZQoaAZHQGsK0MPSUkhoB006AWgIR0CSw2KV6eGxdX2UKGgGR0Bi6VclgMMJaAdN6ANoCEdAksXOtCAtnXV9lChoBkdAa09nLaEi+2gHTZ8BaAhHQJLJ6ZKFqSJ1fZQoaAZHQG1kGmtQsPJoB01NA2gIR0CSygdGRV6vdX2UKGgGR0BjifNs3yZsaAdN6ANoCEdAkswarmyPdXV9lChoBkdAbgFtNSIgvGgHTa4BaAhHQJLPoEJSiud1fZQoaAZHQF/U2ovSMLpoB03oA2gIR0CS0s5nDiwTdX2UKGgGR0BnJYHcDbJwaAdN6ANoCEdAktLPVy3kP3V9lChoBkdAbWZ6iTMaCWgHTbICaAhHQJLWMiRnvlV1fZQoaAZHQGEe0vXbudBoB03oA2gIR0CS23ioKlYVdX2UKGgGR0BvJ85IYm9haAdNMANoCEdAkuENv863iXV9lChoBkdAZEk4c3l0YGgHTegDaAhHQJLi1ZgXuVp1fZQoaAZHQFjnbZvkzXVoB03oA2gIR0CS6wlijL0SdX2UKGgGR0BkT3LaEi+taAdN6ANoCEdAkvOcJdB0IXV9lChoBkdAZAyKpkwvg2gHTegDaAhHQJL2Xxsl9jR1fZQoaAZHQG4v5kCmuT1oB007A2gIR0CS+jYXwb2ldX2UKGgGR0BiHZ1xKg7HaAdN6ANoCEdAkv1ZtrKvFHV9lChoBkdAZlWjO9nK4mgHTegDaAhHQJMCXwlSjxl1fZQoaAZHQF4o1Aqur6toB03oA2gIR0CTCUH+6y0KdX2UKGgGR0BlI+iJwbVCaAdN6ANoCEdAkwltvKlpGnV9lChoBkdAZKyIyj59E2gHTegDaAhHQJMLtj6N2kl1fZQoaAZHQHC4Q+hXbM5oB02dAWgIR0CTDTXmNipedX2UKGgGR0Bft5T2nKnvaAdN6ANoCEdAkw9vQa72+XV9lChoBkdAWlDKgZjx1GgHTegDaAhHQJMTqtbLU1B1fZQoaAZHQFxk4VARkEtoB03oA2gIR0CTE7Q79ycTdX2UKGgGR0BiS0aKk2xZaAdN6ANoCEdAkxgRx5s0pHV9lChoBkdATPIo7V8TjGgHS81oCEdAkxw3HNorWnV9lChoBkdAYGv3gUDdQGgHTegDaAhHQJMeYafjCHh1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 180, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV/QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgLjAJpOJSJiIeUUpQoSwNoD05OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.0+cu121", "GPU Enabled": "True", "Numpy": "1.26.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7a8e71966d40>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a8e71966dd0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a8e71966e60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a8e71966ef0>", "_build": "<function ActorCriticPolicy._build at 0x7a8e71966f80>", "forward": "<function ActorCriticPolicy.forward at 0x7a8e71967010>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a8e719670a0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a8e71967130>", "_predict": "<function ActorCriticPolicy._predict at 0x7a8e719671c0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a8e71967250>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a8e719672e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a8e71967370>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7a8e72290180>"}, "verbose": 0, "policy_kwargs": {}, "num_timesteps": 131072, "_total_timesteps": 100000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1724931803726300587, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": null, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.3107200000000001, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCihxgiNbWMAWyUTRUBjAF0lEdAnT30BXCCSXV9lChoBkdAcYvZKFqSHWgHTREBaAhHQJ0/JT6zmfZ1fZQoaAZHQHCJrX+VC5VoB00NAWgIR0CdPyVzp5eJdX2UKGgGR0BuimbqhUR4aAdL+GgIR0CdQbgGbCrMdX2UKGgGR0BguNiONo8IaAdN6ANoCEdAnUHwzUI9knV9lChoBkdAb/oukk8ifWgHS+hoCEdAnULHa8Hv+nV9lChoBkdAcNzHiFTNuGgHTacBaAhHQJ1Dpk+X7ch1fZQoaAZHQDjZ3GGVRk5oB0vpaAhHQJ1FpJf6XSl1fZQoaAZHQGJ2mZmZmZpoB03oA2gIR0CdRssqril0dX2UKGgGR0BicicEvCdjaAdN6ANoCEdAnUmPUWl/IHV9lChoBkdAR8rHn2ZiNWgHS9hoCEdAnUmv3FkxynV9lChoBkdAcjhm3OObRWgHS/NoCEdAnUmxFuvU0HV9lChoBkdAbzFQTmGM42gHTQkCaAhHQJ1PWdRR/Ex1fZQoaAZHQGzTGnn+yZ9oB02rAWgIR0CdUBHmig01dX2UKGgGR0BxGb7+DOC5aAdNFAFoCEdAnVJAPiDM/3V9lChoBkdAcgPenAIppmgHTQwBaAhHQJ1SxuGbkOt1fZQoaAZHQHHLJwn6VMVoB00SAWgIR0CdVSLdN34cdX2UKGgGR8BJoXZXdTHbaAdL12gIR0CdVWAgPmPpdX2UKGgGR0BuDJ2r4nF6aAdL+WgIR0CdVvdTo+wDdX2UKGgGR0BxVzmeUY8/aAdNBwFoCEdAnVeSGnGbTnV9lChoBkdAZgd+jM3ZPGgHTegDaAhHQJ1Xp+w1R+B1fZQoaAZHQG+pIhQm/nJoB0v6aAhHQJ1a8SL61st1fZQoaAZHQHFB6QRwqAloB0vlaAhHQJ1c2WLP2PF1fZQoaAZHQF+KG8274BVoB03oA2gIR0CdXYMfA9FGdX2UKGgGR0BwSTgLqlguaAdNCwFoCEdAnV4F0YCQtHV9lChoBkdAb8Xzp5eJHmgHTdMBaAhHQJ1eeP5pJwt1fZQoaAZHQHGbQp8WsRxoB0vkaAhHQJ1fBouf29N1fZQoaAZHQHDjYKhL5ARoB01gAWgIR0CdX8fiPyTZdX2UKGgGR0BvLDU3GXHBaAdL82gIR0CdX9GgzxgBdX2UKGgGR0BwZrd2xIJ7aAdNCgFoCEdAnWKtLlFMI3V9lChoBkdAcMy6eGwiaGgHTRMBaAhHQJ1jGdUbT+h1fZQoaAZHQGAbQUHpr1xoB03oA2gIR0CdZgLPldTpdX2UKGgGR0BFTYkVvddnaAdL1mgIR0CdZjmdiDujdX2UKGgGR0ByMwOLBKtgaAdNEwFoCEdAnWZ1oUSIxnV9lChoBkdAYfPqHGjsU2gHTegDaAhHQJ1mdh6Skj51fZQoaAZHQHFg0UTL4etoB0vnaAhHQJ3MpS1maph1fZQoaAZHQHImnxjJ+2FoB0vRaAhHQJ3NjNY8uBd1fZQoaAZHQG/GBomG/N9oB02kAWgIR0CdzbIAwPAgdX2UKGgGR0ByNI61b7j1aAdNBwFoCEdAnc7mjwhGIHV9lChoBkdAbEN9ph4MW2gHTbEDaAhHQJ3QJ5le4Td1fZQoaAZHQHBZwnQY1pFoB01cAWgIR0Cd0E7N0NjLdX2UKGgGR0BBVXs5XEIgaAdLyWgIR0Cd0J29L6DXdX2UKGgGR0BsABC2MKkVaAdNJgFoCEdAndDrUb1h9nV9lChoBkdAYs7V6NVBEGgHTegDaAhHQJ3UmkSElE91fZQoaAZHQFzqf779AHFoB03oA2gIR0Cd1M2zOX3QdX2UKGgGR0Bxoo7/4qPPaAdNCAFoCEdAndWosunMuHV9lChoBkdAcDPX8O09hmgHTRYBaAhHQJ3WirfcesB1fZQoaAZHQDdkxubZvk1oB0u9aAhHQJ3XZl5GBnV1fZQoaAZHQG4jhhx5s0poB0v7aAhHQJ3XeDdxhlV1fZQoaAZHQHG1AIyCWeJoB00dAWgIR0Cd2KrwvxpddX2UKGgGR0Bw2JUT+NtJaAdNQAFoCEdAndknf2saKnV9lChoBkdAcof9YOlO5GgHS+loCEdAndlP+GXXy3V9lChoBkdAbLAT6i0v5GgHS+JoCEdAnd1U6cRUWHV9lChoBkdAcMB37UG3WmgHS/xoCEdAnd6jlkpZwHV9lChoBkdAb3sGFi8WbmgHS+9oCEdAnd8aBqbjLnV9lChoBkdAcc24qwyIpGgHS/poCEdAneCyMo+fRXV9lChoBkdAb/KkP+XJHWgHTQ0BaAhHQJ3jkFB6a9d1fZQoaAZHQG1gVMuez2RoB00SAWgIR0Cd48INVinYdX2UKGgGR0BvZwbdadMCaAdL62gIR0Cd5FXK8tf5dX2UKGgGR0Blz+cc2itaaAdN6AFoCEdAneZxwl0HQnV9lChoBkdAbU+ADJU5uWgHTSUBaAhHQJ3nj+6y0KJ1fZQoaAZHQHLGtZNfw7VoB01bAWgIR0Cd6h1yvLX+dX2UKGgGR0BxLWTGHYYjaAdL/GgIR0Cd7a/CqIacdX2UKGgGR0Bxsi2H+IdmaAdNOgFoCEdAne8wvlEJB3V9lChoBkdAWzYDhcZ9/mgHTegDaAhHQJ3xH58BuGd1fZQoaAZHQG+vnOryUcJoB0v1aAhHQJ3xtrgwXZZ1fZQoaAZHQG1du4gA6uJoB0v6aAhHQJ3yg9mpVCJ1fZQoaAZHQG2cMQNCqp9oB03DA2gIR0Cd9HTTfBN3dX2UKGgGR0BvhLEcbR4RaAdNhAFoCEdAnfan/tICl3V9lChoBkdAcZM+uNgjQmgHTQYBaAhHQJ338EzO5ax1fZQoaAZHQHBlSmdiDuloB01CAWgIR0Cd+NF4LThHdX2UKGgGR0Bex52pyZKGaAdN6ANoCEdAnfqDL0SRKnV9lChoBkdAXDhHz6JqI2gHTegDaAhHQJ36wLUkOZt1fZQoaAZHQHCPHeaa1CxoB00IAWgIR0Cd+/ECeVcEdX2UKGgGR0Bvxiwt8NQTaAdL3mgIR0Cd/E/1xsEadX2UKGgGR0Bdm9a2WpqAaAdN6ANoCEdAnf4ztXxOL3V9lChoBkdAcSwYukDZDmgHTSUBaAhHQJ3+4B/7SAp1fZQoaAZHQHG1R+nZTQ5oB00XAWgIR0Cd/3mozeoDdX2UKGgGR0Befh4t6HCXaAdN6ANoCEdAnf/phWo3rHV9lChoBkdAcGeabF0gbWgHS/xoCEdAngAIUSIxg3V9lChoBkdAbnNqWTot+WgHS/5oCEdAngGwmReTmnV9lChoBkdAcJzV/MGHHmgHS+poCEdAngKYvvjOs3V9lChoBkdAbjoyLQ5WBGgHS+FoCEdAngPkoKD02HV9lChoBkdAcYItz0Yj0WgHS/toCEdAngZPv0AcUHV9lChoBkdAJtNiYsunM2gHS8doCEdAngcOsHSncnV9lChoBkdAcqt1Q66remgHTRoBaAhHQJ4ILMJQcgh1fZQoaAZHQGryl98Z1mtoB00SAWgIR0CeDBHG0eEJdX2UKGgGR0BgudvES/TLaAdN6ANoCEdAnhDeSB9TgnV9lChoBkdAYRFS9du50GgHTegDaAhHQJ4VHnxJ/Xp1fZQoaAZHQGOkDcVQAMloB03oA2gIR0CeGBh4+r2hdX2UKGgGR0Bt/RDZ13dLaAdNBwJoCEdAnhmn8jzI3nV9lChoBkdAckHkE9t/F2gHTQoBaAhHQJ4bFrXUYsN1fZQoaAZHQGGKrnDBMzxoB03oA2gIR0CeH6DIikftdX2UKGgGR0BxFTNX5nDjaAdL9mgIR0CeIA0Rvm5ldX2UKGgGR0BwqFfYzzmPaAdL+mgIR0CeJnPN3W4FdX2UKGgGR0Bt+BAWznieaAdL9GgIR0CeJ0zLwF1TdX2UKGgGR0Bdh5nctXgcaAdN6ANoCEdAnioMcABDHHV9lChoBkdAcETC4jKPn2gHS/hoCEdAnix0k0JnhHV9lChoBkdAXy9uIhyKemgHTegDaAhHQJ4s3OX3QD51fZQoaAZHQHG5OwTufEpoB01VAWgIR0CeLXftQbdadWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 220, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV/QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgLjAJpOJSJiIeUUpQoSwNoD05OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.0+cu121", "GPU Enabled": "True", "Numpy": "1.26.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2633de360af29f41fda24dd7fd3a357b4a1cf3d18f32e2e06ded1901cad2039a
3
- size 147316
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ddf684e580da55b3eaed722aaf1bc7a5a2f85bbd3aee741ce8fd21292d000d7
3
+ size 147272
ppo-LunarLander-v2/data CHANGED
@@ -26,7 +26,7 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1724931069041287856,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": null,
@@ -42,13 +42,13 @@
42
  "_stats_window_size": 100,
43
  "ep_info_buffer": {
44
  ":type:": "<class 'collections.deque'>",
45
- ":serialized:": "gAWVPwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGAxRJEpiJCMAWyUTegDjAF0lEdAkR/V0Lc9GXV9lChoBkdAZd8iwjdHlWgHTegDaAhHQJEf11SwW311fZQoaAZHQF12Em6XjVBoB03oA2gIR0CRH9f4REncdX2UKGgGR0BkAROxjawmaAdN6ANoCEdAkR/Ys3AEdXV9lChoBkdAVRt6D5CWvGgHTegDaAhHQJEf2ixmkFh1fZQoaAZHQF6r7Xg9/z9oB03oA2gIR0CRH9vc8DB/dX2UKGgGR0BjSwTIvJzUaAdN6ANoCEdAkR/d0vGp/HV9lChoBkdAY9K0IC2c8WgHTegDaAhHQJEf3obGWD91fZQoaAZHQGWTLh73PAxoB03oA2gIR0CRH9/H5rP/dX2UKGgGR0BgRGSEDhcaaAdN6ANoCEdAkSTrrgOz6nV9lChoBkdAYfMujASFoWgHTegDaAhHQJEmz3BYV7B1fZQoaAZHQGMB/w7T2FpoB03oA2gIR0CRKQa8Yht+dX2UKGgGR0BGgRe1KGtZaAdLxGgIR0CRMdMUh3aBdX2UKGgGR0BhAWkHlfZ3aAdN6ANoCEdAkUSQuM+/xnV9lChoBkdAYRP+2E0zj2gHTegDaAhHQJFLralDWsl1fZQoaAZHQGLSh/RVp9JoB03oA2gIR0CRWehDPWxydX2UKGgGR0Bg1hRMvh60aAdN6ANoCEdAkVvRNRFZxXV9lChoBkdAVef9xZMcqGgHTegDaAhHQJFb0h2W6bx1fZQoaAZHQGYbKQaJhv1oB03oA2gIR0CRW9Nke6qbdX2UKGgGR0BgFC0WuX/paAdN6ANoCEdAkVvUnLJSznV9lChoBkdAYgR1LamGd2gHTegDaAhHQJFb1cTrVvx1fZQoaAZHQGIwhBJI1+BoB03oA2gIR0CRW9cJtzjndX2UKGgGR0Bj4Y4XGff5aAdN6ANoCEdAkVvYs/Y8MnV9lChoBkdAYW2+WWyC4GgHTegDaAhHQJFb2oR7JGR1fZQoaAZHQFvalk6Lfk5oB03oA2gIR0CRW9vv0AcUdX2UKGgGR0BnFnBi1AqvaAdN6ANoCEdAkVveCf6Gg3V9lChoBkdAcJCVo6CDmWgHTeACaAhHQJHFUTewcHZ1fZQoaAZHQF305wOvt+loB03oA2gIR0CRxi2vStvGdX2UKGgGR0BKeGhdt2s8aAdLqmgIR0CRxygOSW7fdX2UKGgGR0Bjn3nEETxoaAdN6ANoCEdAkcnIHPeHi3V9lChoBkdAbaa1a4c3l2gHTaUBaAhHQJHUcVBUrCp1fZQoaAZHQGUgXMINVipoB03oA2gIR0CR5DpbUwztdX2UKGgGR0BeQtld1MdtaAdN6ANoCEdAket9jLB9C3V9lChoBkdAYVfLdN34bmgHTegDaAhHQJH5xfICEHt1fZQoaAZHQGBIdTo+wC9oB03oA2gIR0CR+5gmJFb3dX2UKGgGR0Bhj2Y8dPtVaAdN6ANoCEdAkfuZDZ13dXV9lChoBkdAYmJbxmTTv2gHTegDaAhHQJH7ms3hn8N1fZQoaAZHQGDETySV4X5oB03oA2gIR0CR+5u7YkE+dX2UKGgGR0Bfp3Upd8iOaAdN6ANoCEdAkfudLpRoAXV9lChoBkdAW9bebd8ArGgHTegDaAhHQJH7niiqQzV1fZQoaAZHQGbjCFsYVItoB03oA2gIR0CR+58qWkaddX2UKGgGR0Biz41FYuCgaAdN6ANoCEdAkfugRkEs8XV9lChoBkdAYTpMYdhiLGgHTegDaAhHQJIAAFRpDeF1fZQoaAZHQGMx0ojOcDtoB03oA2gIR0CSAPFAmiQDdX2UKGgGR0BfBxT0g8r7aAdN6ANoCEdAkgIFII4VAXV9lChoBkdAZxwWjXWe6WgHTegDaAhHQJIExas6q811fZQoaAZHQDc0QjD8+A5oB0vHaAhHQJIOYO7QLNR1fZQoaAZHQGHbscIZ62RoB03oA2gIR0CSEu+wTufFdX2UKGgGR0Bs+efmLcbjaAdNrAFoCEdAkhOA57w8XHV9lChoBkdAbQ6X7cfvF2gHTUgBaAhHQJIVGlpGnXN1fZQoaAZHQGw3Ba9sabZoB03UAmgIR0CSFhJCjUNKdX2UKGgGR0BxGtIJ7b+MaAdNAwJoCEdAkhjYo3JgcHV9lChoBkdAXmYc94eLemgHTegDaAhHQJIeo1n/T9d1fZQoaAZHQAsYkeIVM25oB0v5aAhHQJIjb24/eLx1fZQoaAZHQG6km4Ajps5oB00HA2gIR0CSJxsmv4dqdX2UKGgGR0BsXmhZha1UaAdNcgNoCEdAki1ny/bj+HV9lChoBkdAXet6QeV9nmgHTegDaAhHQJIyl4eLehx1fZQoaAZHQFrqro4dZJVoB03oA2gIR0CSNE9Jz1brdX2UKGgGR0BiHie9SMtLaAdN6ANoCEdAkjRQAMlTnHV9lChoBkdAXTe/bj94vGgHTegDaAhHQJI0UD1XeWR1fZQoaAZHQGDlXdj5KvpoB03oA2gIR0CSNFGrCFbndX2UKGgGR0BiaT8aXKKYaAdN6ANoCEdAkjs6WHDaXnV9lChoBkdAY4ajtXxOL2gHTegDaAhHQJKkfBsQ/X51fZQoaAZHQGyZiJfpljFoB03TAmgIR0CSrRfU4JeFdX2UKGgGR0Bj58OG0u14aAdN6ANoCEdAkq7BXKbKBHV9lChoBkdAa4fyQxN7B2gHTbUDaAhHQJKw5TYNAkd1fZQoaAZHQGGOxZ+x4Y9oB03oA2gIR0CSsqC0F8ohdX2UKGgGR0Bh+BV4oqkNaAdN6ANoCEdAkrMGzF+/g3V9lChoBkdAb3TdRiw0O2gHTQwCaAhHQJK2bdUKiPB1fZQoaAZHQGLIPvrnkktoB03oA2gIR0CSt4qxTsIFdX2UKGgGR0Bu3EPe54GEaAdNGwJoCEdAkritnoPkJnV9lChoBkdAcRRcer+5v2gHTawDaAhHQJK+qHk92X91fZQoaAZHQGsK0MPSUkhoB006AWgIR0CSw2KV6eGxdX2UKGgGR0Bi6VclgMMJaAdN6ANoCEdAksXOtCAtnXV9lChoBkdAa09nLaEi+2gHTZ8BaAhHQJLJ6ZKFqSJ1fZQoaAZHQG1kGmtQsPJoB01NA2gIR0CSygdGRV6vdX2UKGgGR0BjifNs3yZsaAdN6ANoCEdAkswarmyPdXV9lChoBkdAbgFtNSIgvGgHTa4BaAhHQJLPoEJSiud1fZQoaAZHQF/U2ovSMLpoB03oA2gIR0CS0s5nDiwTdX2UKGgGR0BnJYHcDbJwaAdN6ANoCEdAktLPVy3kP3V9lChoBkdAbWZ6iTMaCWgHTbICaAhHQJLWMiRnvlV1fZQoaAZHQGEe0vXbudBoB03oA2gIR0CS23ioKlYVdX2UKGgGR0BvJ85IYm9haAdNMANoCEdAkuENv863iXV9lChoBkdAZEk4c3l0YGgHTegDaAhHQJLi1ZgXuVp1fZQoaAZHQFjnbZvkzXVoB03oA2gIR0CS6wlijL0SdX2UKGgGR0BkT3LaEi+taAdN6ANoCEdAkvOcJdB0IXV9lChoBkdAZAyKpkwvg2gHTegDaAhHQJL2Xxsl9jR1fZQoaAZHQG4v5kCmuT1oB007A2gIR0CS+jYXwb2ldX2UKGgGR0BiHZ1xKg7HaAdN6ANoCEdAkv1ZtrKvFHV9lChoBkdAZlWjO9nK4mgHTegDaAhHQJMCXwlSjxl1fZQoaAZHQF4o1Aqur6toB03oA2gIR0CTCUH+6y0KdX2UKGgGR0BlI+iJwbVCaAdN6ANoCEdAkwltvKlpGnV9lChoBkdAZKyIyj59E2gHTegDaAhHQJMLtj6N2kl1fZQoaAZHQHC4Q+hXbM5oB02dAWgIR0CTDTXmNipedX2UKGgGR0Bft5T2nKnvaAdN6ANoCEdAkw9vQa72+XV9lChoBkdAWlDKgZjx1GgHTegDaAhHQJMTqtbLU1B1fZQoaAZHQFxk4VARkEtoB03oA2gIR0CTE7Q79ycTdX2UKGgGR0BiS0aKk2xZaAdN6ANoCEdAkxgRx5s0pHV9lChoBkdATPIo7V8TjGgHS81oCEdAkxw3HNorWnV9lChoBkdAYGv3gUDdQGgHTegDaAhHQJMeYafjCHh1ZS4="
46
  },
47
  "ep_success_buffer": {
48
  ":type:": "<class 'collections.deque'>",
49
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
50
  },
51
- "_n_updates": 180,
52
  "observation_space": {
53
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
54
  ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1724931803726300587,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": null,
 
42
  "_stats_window_size": 100,
43
  "ep_info_buffer": {
44
  ":type:": "<class 'collections.deque'>",
45
+ ":serialized:": "gAWVHwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCihxgiNbWMAWyUTRUBjAF0lEdAnT30BXCCSXV9lChoBkdAcYvZKFqSHWgHTREBaAhHQJ0/JT6zmfZ1fZQoaAZHQHCJrX+VC5VoB00NAWgIR0CdPyVzp5eJdX2UKGgGR0BuimbqhUR4aAdL+GgIR0CdQbgGbCrMdX2UKGgGR0BguNiONo8IaAdN6ANoCEdAnUHwzUI9knV9lChoBkdAb/oukk8ifWgHS+hoCEdAnULHa8Hv+nV9lChoBkdAcNzHiFTNuGgHTacBaAhHQJ1Dpk+X7ch1fZQoaAZHQDjZ3GGVRk5oB0vpaAhHQJ1FpJf6XSl1fZQoaAZHQGJ2mZmZmZpoB03oA2gIR0CdRssqril0dX2UKGgGR0BicicEvCdjaAdN6ANoCEdAnUmPUWl/IHV9lChoBkdAR8rHn2ZiNWgHS9hoCEdAnUmv3FkxynV9lChoBkdAcjhm3OObRWgHS/NoCEdAnUmxFuvU0HV9lChoBkdAbzFQTmGM42gHTQkCaAhHQJ1PWdRR/Ex1fZQoaAZHQGzTGnn+yZ9oB02rAWgIR0CdUBHmig01dX2UKGgGR0BxGb7+DOC5aAdNFAFoCEdAnVJAPiDM/3V9lChoBkdAcgPenAIppmgHTQwBaAhHQJ1SxuGbkOt1fZQoaAZHQHHLJwn6VMVoB00SAWgIR0CdVSLdN34cdX2UKGgGR8BJoXZXdTHbaAdL12gIR0CdVWAgPmPpdX2UKGgGR0BuDJ2r4nF6aAdL+WgIR0CdVvdTo+wDdX2UKGgGR0BxVzmeUY8/aAdNBwFoCEdAnVeSGnGbTnV9lChoBkdAZgd+jM3ZPGgHTegDaAhHQJ1Xp+w1R+B1fZQoaAZHQG+pIhQm/nJoB0v6aAhHQJ1a8SL61st1fZQoaAZHQHFB6QRwqAloB0vlaAhHQJ1c2WLP2PF1fZQoaAZHQF+KG8274BVoB03oA2gIR0CdXYMfA9FGdX2UKGgGR0BwSTgLqlguaAdNCwFoCEdAnV4F0YCQtHV9lChoBkdAb8Xzp5eJHmgHTdMBaAhHQJ1eeP5pJwt1fZQoaAZHQHGbQp8WsRxoB0vkaAhHQJ1fBouf29N1fZQoaAZHQHDjYKhL5ARoB01gAWgIR0CdX8fiPyTZdX2UKGgGR0BvLDU3GXHBaAdL82gIR0CdX9GgzxgBdX2UKGgGR0BwZrd2xIJ7aAdNCgFoCEdAnWKtLlFMI3V9lChoBkdAcMy6eGwiaGgHTRMBaAhHQJ1jGdUbT+h1fZQoaAZHQGAbQUHpr1xoB03oA2gIR0CdZgLPldTpdX2UKGgGR0BFTYkVvddnaAdL1mgIR0CdZjmdiDujdX2UKGgGR0ByMwOLBKtgaAdNEwFoCEdAnWZ1oUSIxnV9lChoBkdAYfPqHGjsU2gHTegDaAhHQJ1mdh6Skj51fZQoaAZHQHFg0UTL4etoB0vnaAhHQJ3MpS1maph1fZQoaAZHQHImnxjJ+2FoB0vRaAhHQJ3NjNY8uBd1fZQoaAZHQG/GBomG/N9oB02kAWgIR0CdzbIAwPAgdX2UKGgGR0ByNI61b7j1aAdNBwFoCEdAnc7mjwhGIHV9lChoBkdAbEN9ph4MW2gHTbEDaAhHQJ3QJ5le4Td1fZQoaAZHQHBZwnQY1pFoB01cAWgIR0Cd0E7N0NjLdX2UKGgGR0BBVXs5XEIgaAdLyWgIR0Cd0J29L6DXdX2UKGgGR0BsABC2MKkVaAdNJgFoCEdAndDrUb1h9nV9lChoBkdAYs7V6NVBEGgHTegDaAhHQJ3UmkSElE91fZQoaAZHQFzqf779AHFoB03oA2gIR0Cd1M2zOX3QdX2UKGgGR0Bxoo7/4qPPaAdNCAFoCEdAndWosunMuHV9lChoBkdAcDPX8O09hmgHTRYBaAhHQJ3WirfcesB1fZQoaAZHQDdkxubZvk1oB0u9aAhHQJ3XZl5GBnV1fZQoaAZHQG4jhhx5s0poB0v7aAhHQJ3XeDdxhlV1fZQoaAZHQHG1AIyCWeJoB00dAWgIR0Cd2KrwvxpddX2UKGgGR0Bw2JUT+NtJaAdNQAFoCEdAndknf2saKnV9lChoBkdAcof9YOlO5GgHS+loCEdAndlP+GXXy3V9lChoBkdAbLAT6i0v5GgHS+JoCEdAnd1U6cRUWHV9lChoBkdAcMB37UG3WmgHS/xoCEdAnd6jlkpZwHV9lChoBkdAb3sGFi8WbmgHS+9oCEdAnd8aBqbjLnV9lChoBkdAcc24qwyIpGgHS/poCEdAneCyMo+fRXV9lChoBkdAb/KkP+XJHWgHTQ0BaAhHQJ3jkFB6a9d1fZQoaAZHQG1gVMuez2RoB00SAWgIR0Cd48INVinYdX2UKGgGR0BvZwbdadMCaAdL62gIR0Cd5FXK8tf5dX2UKGgGR0Blz+cc2itaaAdN6AFoCEdAneZxwl0HQnV9lChoBkdAbU+ADJU5uWgHTSUBaAhHQJ3nj+6y0KJ1fZQoaAZHQHLGtZNfw7VoB01bAWgIR0Cd6h1yvLX+dX2UKGgGR0BxLWTGHYYjaAdL/GgIR0Cd7a/CqIacdX2UKGgGR0Bxsi2H+IdmaAdNOgFoCEdAne8wvlEJB3V9lChoBkdAWzYDhcZ9/mgHTegDaAhHQJ3xH58BuGd1fZQoaAZHQG+vnOryUcJoB0v1aAhHQJ3xtrgwXZZ1fZQoaAZHQG1du4gA6uJoB0v6aAhHQJ3yg9mpVCJ1fZQoaAZHQG2cMQNCqp9oB03DA2gIR0Cd9HTTfBN3dX2UKGgGR0BvhLEcbR4RaAdNhAFoCEdAnfan/tICl3V9lChoBkdAcZM+uNgjQmgHTQYBaAhHQJ338EzO5ax1fZQoaAZHQHBlSmdiDuloB01CAWgIR0Cd+NF4LThHdX2UKGgGR0Bex52pyZKGaAdN6ANoCEdAnfqDL0SRKnV9lChoBkdAXDhHz6JqI2gHTegDaAhHQJ36wLUkOZt1fZQoaAZHQHCPHeaa1CxoB00IAWgIR0Cd+/ECeVcEdX2UKGgGR0Bvxiwt8NQTaAdL3mgIR0Cd/E/1xsEadX2UKGgGR0Bdm9a2WpqAaAdN6ANoCEdAnf4ztXxOL3V9lChoBkdAcSwYukDZDmgHTSUBaAhHQJ3+4B/7SAp1fZQoaAZHQHG1R+nZTQ5oB00XAWgIR0Cd/3mozeoDdX2UKGgGR0Befh4t6HCXaAdN6ANoCEdAnf/phWo3rHV9lChoBkdAcGeabF0gbWgHS/xoCEdAngAIUSIxg3V9lChoBkdAbnNqWTot+WgHS/5oCEdAngGwmReTmnV9lChoBkdAcJzV/MGHHmgHS+poCEdAngKYvvjOs3V9lChoBkdAbjoyLQ5WBGgHS+FoCEdAngPkoKD02HV9lChoBkdAcYItz0Yj0WgHS/toCEdAngZPv0AcUHV9lChoBkdAJtNiYsunM2gHS8doCEdAngcOsHSncnV9lChoBkdAcqt1Q66remgHTRoBaAhHQJ4ILMJQcgh1fZQoaAZHQGryl98Z1mtoB00SAWgIR0CeDBHG0eEJdX2UKGgGR0BgudvES/TLaAdN6ANoCEdAnhDeSB9TgnV9lChoBkdAYRFS9du50GgHTegDaAhHQJ4VHnxJ/Xp1fZQoaAZHQGOkDcVQAMloB03oA2gIR0CeGBh4+r2hdX2UKGgGR0Bt/RDZ13dLaAdNBwJoCEdAnhmn8jzI3nV9lChoBkdAckHkE9t/F2gHTQoBaAhHQJ4bFrXUYsN1fZQoaAZHQGGKrnDBMzxoB03oA2gIR0CeH6DIikftdX2UKGgGR0BxFTNX5nDjaAdL9mgIR0CeIA0Rvm5ldX2UKGgGR0BwqFfYzzmPaAdL+mgIR0CeJnPN3W4FdX2UKGgGR0Bt+BAWznieaAdL9GgIR0CeJ0zLwF1TdX2UKGgGR0Bdh5nctXgcaAdN6ANoCEdAnioMcABDHHV9lChoBkdAcETC4jKPn2gHS/hoCEdAnix0k0JnhHV9lChoBkdAXy9uIhyKemgHTegDaAhHQJ4s3OX3QD51fZQoaAZHQHG5OwTufEpoB01VAWgIR0CeLXftQbdadWUu"
46
  },
47
  "ep_success_buffer": {
48
  ":type:": "<class 'collections.deque'>",
49
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
50
  },
51
+ "_n_updates": 220,
52
  "observation_space": {
53
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
54
  ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05bd73df6ef187ef1292cb4f76bd7950e153e32d2776f6d6b84677d092700953
3
  size 88490
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ae42d90d7295442a2565448bb55f7b41d8ba1247e07e9762aa52f967cc7d04d
3
  size 88490
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:721e886c40a4945fcce52befaa75a04902d8a23decd3716af52a52d8c1f9c478
3
  size 43762
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f0c83f956fe9fb51b3914c31b04ab9028aa064c3305dd7902e8b59ec9410738
3
  size 43762
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 224.56240359999998, "std_reward": 70.41596923275944, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-08-29T11:38:48.492041"}
 
1
+ {"mean_reward": 223.8249014, "std_reward": 62.285083669348666, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-08-29T11:48:36.126178"}