oliar commited on
Commit
9099526
1 Parent(s): 894889f

Tried running the lunar lander PPO with 10mil timestamps; limited success.

Browse files
LunarLander-v2-10m_ts.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56f6312366fe5e478e1a64c87998a9508121a52b853cfca200422a17b7435f71
3
+ size 147930
LunarLander-v2-10m_ts/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.0.0a5
LunarLander-v2-10m_ts/data ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
+ "__module__": "stable_baselines3.common.policies",
6
+ "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7815ce6ac9d0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7815ce6aca60>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7815ce6acaf0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7815ce6acb80>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7815ce6acc10>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7815ce6acca0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7815ce6acd30>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7815ce6acdc0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7815ce6ace50>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7815ce6acee0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7815ce6acf70>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7815ce6ad000>",
19
+ "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7815ce84a440>"
21
+ },
22
+ "verbose": 1,
23
+ "policy_kwargs": {},
24
+ "num_timesteps": 10010624,
25
+ "_total_timesteps": 10000000,
26
+ "_num_timesteps_at_start": 0,
27
+ "seed": null,
28
+ "action_noise": null,
29
+ "start_time": 1698505574986195902,
30
+ "learning_rate": 0.0003,
31
+ "tensorboard_log": null,
32
+ "_last_obs": {
33
+ ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZ6JT7huvQ9Sp0av1+V374hd8o96kLIvgAAAAAAAAAAGo2hPb7/sj+1D9k+Nl18vr4z9j1Ceos+AAAAAAAAAAAzr4u7SPuIuoOqmzUz2JAv+RRGOk6csbQAAIA/AACAP82UNj177JW6/Q0yvQxYLDMCmjK7qz1PswAAgD8AAIA/cxnwPQfmrz9FiOU+1ULBvkDtaD5Tgp8+AAAAAAAAAAAzHds9tBPAP6aiIz/BV6A9/4SIPd4JvD4AAAAAAAAAAM14sDwUrpu43YLAs/4ygq7qJ9W7y3utMwAAgD8AAIA/AFg9O9dBFrs9c+g7SfSRPDWMErwz7Hs9AACAPwAAgD864D8++1pOP5/SNj7NVyG/Hc3uPq4liz0AAAAAAAAAAJqH0b3kQSY/MB+7vV2KV78+i4e+4gFvvAAAAAAAAAAAZra8vMqJrj9uWOO+u8byvkodCzz2HSW9AAAAAAAAAABmvF8+tVWGP+pdFT6/+TS/8sX4PnxwBD0AAAAAAAAAAM1TVz04jM896sGevsmtsr4NmJ29JTNVvgAAAAAAAAAAQNWmPaQdET5OBm++5IPJvoW0r7yGXjK+AAAAAAAAAAAAy4M8rjWEusgKZzMFZ5Wv2UN5uqs7wbMAAIA/AACAPwCjxLwrnoA9FBU1PnE52b66VFk97rjNPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
+ },
36
+ "_last_episode_starts": {
37
+ ":type:": "<class 'numpy.ndarray'>",
38
+ ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
39
+ },
40
+ "_last_original_obs": null,
41
+ "_episode_num": 0,
42
+ "use_sde": false,
43
+ "sde_sample_freq": -1,
44
+ "_current_progress_remaining": -0.0010623999999999079,
45
+ "_stats_window_size": 100,
46
+ "ep_info_buffer": {
47
+ ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWV4QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHKqO32EkB2MAWyUS7mMAXSUR0DBD4EOwxFidX2UKGgGR0BxsX0J4SpSaAdLnWgIR0DBD4Cx/ustdX2UKGgGR0BzeN+6RQrMaAdLnGgIR0DBD4kSCe3AdX2UKGgGR0Bv891B+nZTaAdLnGgIR0DBD6Ki22G7dX2UKGgGR0Bz91p35eqraAdLq2gIR0DBEgnuy/sWdX2UKGgGR0BvrN1r6+FlaAdLnWgIR0DBEgtEd/8VdX2UKGgGR0Bzg9RDTjNqaAdLvWgIR0DBEhYkcCHRdX2UKGgGR0BySV9c8kleaAdLuWgIR0DBEh1lK9PDdX2UKGgGR0ByZGUqx1PnaAdLrmgIR0DBEicgjhUBdX2UKGgGR0ByzxLBbfP5aAdLlGgIR0DBEikBKcurdX2UKGgGR0ByjRkf9xZMaAdLnGgIR0DBEjWx4Y78dX2UKGgGR0BzccLw4KhMaAdL3WgIR0DBEjypJf6XdX2UKGgGR0BvjbUy57PZaAdLqWgIR0DBEkSIpH7QdX2UKGgGR0Bw++gYgq3FaAdLoWgIR0DBEklxS5y3dX2UKGgGR0By2MKiO/+LaAdLmmgIR0DBElKtozvadX2UKGgGR0BzGif4AS39aAdL62gIR0DBElZHqeK9dX2UKGgGR0Byj+GdqcmTaAdLrWgIR0DBEmJT2nKodX2UKGgGR0BwthEXtShraAdLs2gIR0DBEmMDwH7hdX2UKGgGR0BxBCY0EX+EaAdLrWgIR0DBEm3RCx/vdX2UKGgGR0Bx8OphnanKaAdLlGgIR0DBEn1vES/TdX2UKGgGR0BvsCWNWEK3aAdLpmgIR0DBEpgFV1fWdX2UKGgGR0ByMdbPhQ3xaAdLl2gIR0DBEq3RTjvNdX2UKGgGR0Byw8+HJtBOaAdLqmgIR0DBEr8YGdI5dX2UKGgGR0Bz94c0cfeUaAdL0GgIR0DBEsEOf/WEdX2UKGgGR0ByUc7V8Ti9aAdLvGgIR0DBEsRSpBHDdX2UKGgGR0Bzg+EpRXOoaAdLyWgIR0DBEsfcN6PbdX2UKGgGR0Bx7YWac7QtaAdLr2gIR0DBEtwTqSowdX2UKGgGR0BzdjfqHGjsaAdLwmgIR0DBEuV3IMjNdX2UKGgGR0Bx6a/zreImaAdLm2gIR0DBEvLIq9XcdX2UKGgGR0Bx/Zs54nndaAdLsmgIR0DBEvVjPOY6dX2UKGgGR0Byfn0Cih38aAdLvmgIR0DBEvc0YTCcdX2UKGgGR0ByQTonrpqzaAdLvmgIR0DBEwPq/ub7dX2UKGgGR0Bzi8okRjBmaAdL3WgIR0DBEw7hR64UdX2UKGgGR0BxEU66reZYaAdLwWgIR0DBExSCFsYVdX2UKGgGR0BzYD1AZ88caAdLumgIR0DBExqbvw3HdX2UKGgGR0BywR62OQyRaAdLsGgIR0DBEyHFYMfBdX2UKGgGR0BwfzfvWpZPaAdLoWgIR0DBEyw9Pk7wdX2UKGgGR0BxrKACnxaxaAdLkmgIR0DBEzI3HaN/dX2UKGgGR0BxWKXZ5AyEaAdLp2gIR0DBE1TpaA4GdX2UKGgGR0Bv27tw71ZlaAdLoGgIR0DBE1c30f5ldX2UKGgGR0BzdyWv8qFzaAdLvWgIR0DBE2v/vOQhdX2UKGgGR0Bz31gUlAu7aAdLvGgIR0DBE254rz5HdX2UKGgGR0Bycctcv/R3aAdLi2gIR0DBE3OLNwBHdX2UKGgGR0ByBP1J17pnaAdLl2gIR0DBE4C17Y03dX2UKGgGR0Bxzx7+kxh2aAdLr2gIR0DBE4VipeeGdX2UKGgGR0ByPfQTmGM5aAdLwWgIR0DBE4yDPGADdX2UKGgGR0BycVe1KGtZaAdLl2gIR0DBE451ie/YdX2UKGgGR0BzzcmVqveQaAdLwmgIR0DBE6P/giu/dX2UKGgGR0Bx5c1tO2y+aAdLo2gIR0DBE7BDu0CzdX2UKGgGR0BxkDLDAJswaAdLtmgIR0DBE7uD3/PxdX2UKGgGR0ByrAfRu0kXaAdLm2gIR0DBE7xrxiG4dX2UKGgGR0ByHHHdXT3JaAdLwGgIR0DBE782aUiZdX2UKGgGR0ByJLkU9IPLaAdLsGgIR0DBE8RMN+b3dX2UKGgGR0BzcGg3974SaAdLrmgIR0DBE9N/x2B8dX2UKGgGR0BxrJCY1He8aAdLp2gIR0DBE++CK77LdX2UKGgGR0Byy2RaHKwIaAdLl2gIR0DBE/jzwtrcdX2UKGgGR0Bz/ZiZv1lHaAdLuGgIR0DBFAF7dBSldX2UKGgGR0BwopqTKT0QaAdLlWgIR0DBFA1MfzSUdX2UKGgGR0ByAM8IRh+faAdLs2gIR0DBFBPJYDDCdX2UKGgGR0By58EJSiudaAdLvGgIR0DBFBQ3gk1NdX2UKGgGR0Bxt/iCJ40NaAdLrmgIR0DBFBk4aP0adX2UKGgGR0BvVEvh60IDaAdLpGgIR0DBFBqeRPoFdX2UKGgGR0BwQ+4oZydXaAdLnGgIR0DBFDLEcbR4dX2UKGgGR0ByOWDK5kLAaAdLmWgIR0DBFDM1qFh5dX2UKGgGR0BzI1rcj7hvaAdLv2gIR0DBFDkhV2iddX2UKGgGR0B0QXpu/DceaAdL4GgIR0DBFD53Roh7dX2UKGgGR0By9Pk/8l5XaAdLsmgIR0DBFEC7K7qZdX2UKGgGR0Bxip4W1twaaAdLmWgIR0DBFEEK7ZnMdX2UKGgGR0BzOv3Cbc46aAdLw2gIR0DBFEMrmQr+dX2UKGgGR0BxVjp5eJHiaAdLnWgIR0DBFFN3+uNhdX2UKGgGR0Bzaj9kz41xaAdL0WgIR0DBFFXUYsNEdX2UKGgGR0BwenogV45caAdLj2gIR0DBFFa3XqZ/dX2UKGgGR0BvEVDc/MW5aAdLnWgIR0DBFFmZPVNIdX2UKGgGR0BRYU7bL2YfaAdLVGgIR0DBFGGJxeb/dX2UKGgGR0Bvdug3974SaAdLpmgIR0DBFGpftx+8dX2UKGgGR0BwMcaWHDaXaAdLqWgIR0DBFHJ17pmmdX2UKGgGR0ByhWbd8Aq/aAdLvWgIR0DBFH3zxwyZdX2UKGgGR0AlrEfDDTBqaAdLTGgIR0DBFIBCpm29dX2UKGgGR0ByXPPszEaVaAdLwWgIR0DBFIa5sj3VdX2UKGgGR0BzYop8WsRyaAdLymgIR0DBFI5g/keZdX2UKGgGR0Bzhtguyu6maAdLqWgIR0DBFKMGxD9gdX2UKGgGR0ByUCyTpxFRaAdLv2gIR0DBFKL0z0pWdX2UKGgGR0ByOVzCDVYqaAdLwmgIR0DBFKpvLowFdX2UKGgGR0ByDs4HX2/SaAdLumgIR0DBFK/6O5rhdX2UKGgGR0Bx77NnoPkJaAdLxWgIR0DBFLTG1hLHdX2UKGgGR0Byh6dYnv2HaAdLrmgIR0DBFLv3BYV7dX2UKGgGR0Bxc5vtMPBjaAdLrmgIR0DBFL9IuoP1dX2UKGgGR0Busiynk1dgaAdLnWgIR0DBFME56t1ZdX2UKGgGR0ByK/g4wRGuaAdLv2gIR0DBFMvbItDldX2UKGgGR0BxF/VAiV0LaAdLpGgIR0DBFNc+5e7ddX2UKGgGR0ByRxChN/OMaAdLh2gIR0DBFNlMPBi1dX2UKGgGR0B0Loo5PuXvaAdLwGgIR0DBFN+BOHnEdX2UKGgGR0By2AUAT7EYaAdLn2gIR0DBFOJ86V+rdX2UKGgGR0BzLwyfthNNaAdLwWgIR0DBFPT1EmY0dX2UKGgGR0Bz2U6nzg/DaAdLrWgIR0DBFPeOp84QdX2UKGgGR0BvKDwrlNlAaAdLl2gIR0DBFP5g3LmqdX2UKGgGR0Byg8tQKrq/aAdNVgFoCEdAwRULjghr33V9lChoBkdActGicG1QZWgHS5toCEdAwRUP1uBMBnV9lChoBkdAcg5Uoa1kUmgHS7JoCEdAwRUQ4ffXPXV9lChoBkdAcPVwe/5+IGgHS59oCEdAwRUWmjTKDHVlLg=="
49
+ },
50
+ "ep_success_buffer": {
51
+ ":type:": "<class 'collections.deque'>",
52
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
+ },
54
+ "_n_updates": 2692,
55
+ "observation_space": {
56
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
+ ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
58
+ "dtype": "float32",
59
+ "bounded_below": "[ True True True True True True True True]",
60
+ "bounded_above": "[ True True True True True True True True]",
61
+ "_shape": [
62
+ 8
63
+ ],
64
+ "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
65
+ "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
66
+ "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
67
+ "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
68
+ "_np_random": null
69
+ },
70
+ "action_space": {
71
+ ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
72
+ ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=",
73
+ "n": "4",
74
+ "start": "0",
75
+ "_shape": [],
76
+ "dtype": "int64",
77
+ "_np_random": null
78
+ },
79
+ "n_envs": 16,
80
+ "n_steps": 1024,
81
+ "gamma": 0.999,
82
+ "gae_lambda": 0.98,
83
+ "ent_coef": 0.01,
84
+ "vf_coef": 0.5,
85
+ "max_grad_norm": 0.5,
86
+ "batch_size": 64,
87
+ "n_epochs": 4,
88
+ "clip_range": {
89
+ ":type:": "<class 'function'>",
90
+ ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
91
+ },
92
+ "clip_range_vf": null,
93
+ "normalize_advantage": true,
94
+ "target_kl": null,
95
+ "lr_schedule": {
96
+ ":type:": "<class 'function'>",
97
+ ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
98
+ }
99
+ }
LunarLander-v2-10m_ts/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faf6eaac08a7d1bad4b39a2d491046bbebb5d1426443b747cc75cad7a214f618
3
+ size 88362
LunarLander-v2-10m_ts/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfde5a0a0158626eb37c396711004ba5d65843bc394ba4fdf8dbd62f65bb83b0
3
+ size 43762
LunarLander-v2-10m_ts/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c35cea3b2e60fb5e7e162d3592df775cd400e575a31c72f359fb9e654ab00c5
3
+ size 864
LunarLander-v2-10m_ts/system_info.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ - OS: Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023
2
+ - Python: 3.10.12
3
+ - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 2.1.0+cu118
5
+ - GPU Enabled: True
6
+ - Numpy: 1.23.5
7
+ - Cloudpickle: 2.2.1
8
+ - Gymnasium: 0.28.1
9
+ - OpenAI Gym: 0.25.2
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 259.75 +/- 12.46
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 302.85 +/- 14.52
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7815ce6ac9d0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7815ce6aca60>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7815ce6acaf0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7815ce6acb80>", "_build": "<function ActorCriticPolicy._build at 0x7815ce6acc10>", "forward": "<function ActorCriticPolicy.forward at 0x7815ce6acca0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7815ce6acd30>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7815ce6acdc0>", "_predict": "<function ActorCriticPolicy._predict at 0x7815ce6ace50>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7815ce6acee0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7815ce6acf70>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7815ce6ad000>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7815ce84a440>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1698503731180515390, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAANr5h71ccQ28kIwKviIpuDx0m4A9mPqXvQAAgD8AAIA/5mprvaXqQj/SnWA9fmz2vixWmr1qDTg9AAAAAAAAAAAzoQg+z95cP7Vi3T0f5u++zh9APvaqQzwAAAAAAAAAAGYhGz3RdwY/479WvTPKor7cpZ88cXO/vAAAAAAAAAAA4MAgvmNWeD+ueZy+bQj4vgwfQr5Oplm9AAAAAAAAAACNkIE97O3DPFCvD76HZCm+0KaLvfIIkL0AAAAAAAAAAA25S74UfbI+uxWpPrM4kb7c2bQ8J8UqPgAAAAAAAAAATQQwvfQojT1lHq49ZDRNvqlY0zyOx/C8AAAAAAAAAAAADla9soyqP8Y/yb5VcuC+19dSvcAFdL4AAAAAAAAAAJoVr7tIPZi6uuJDuvzI67iIhxW7i11sOQAAgD8AAIA/ZnCovcoaaz4nkEw+PH6Xvj9fwD1A1F+9AAAAAAAAAADdKY2+xwOdP7Vi+75fEh2/YObWvhael70AAAAAAAAAAPMELj5RK1g+dJgvvhfyoL7p7XC8OE+ovQAAAAAAAAAAjW28Pa7HlLpZwSe1nlqjryIhETtiLV80AACAPwAAgD8z0/o6ewKVupNskTK7n00wSMydupDzaLMAAIA/AACAPwAN373MTJg/Vi8mv1WPMr/f3BW9U/BHvgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVJwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHICF/+bVjKMAWyUTRQBjAF0lEdAklpdKqXF+HV9lChoBkdAcusO8CgbqGgHTRkBaAhHQJJaZdB0ITp1fZQoaAZHQG/vYFzMibFoB00NAWgIR0CSW0Id2gWadX2UKGgGR0BxuTqptJnQaAdNNgFoCEdAklushcJMQHV9lChoBkdAcIKNNahYeWgHTTEBaAhHQJJcUoa1kUd1fZQoaAZHQHKgEU47zTZoB00KAWgIR0CSXHiKR+z/dX2UKGgGR0ByfwC5mRNiaAdNDAFoCEdAklx5D7ZWaXV9lChoBkdAb93w0fozN2gHTQ8BaAhHQJJdL2RJVbR1fZQoaAZHQHEx3dXT3IxoB0vnaAhHQJJdqIZZSvV1fZQoaAZHQHMf7srupjtoB0vuaAhHQJJeQWl/H5t1fZQoaAZHQHEs6POpsGhoB00QAWgIR0CSXpzWf9P2dX2UKGgGR0BypNdGAkLQaAdNHQFoCEdAkl7pnxri2nV9lChoBkdAcPOZk078vWgHTT8BaAhHQJJfnwuuiex1fZQoaAZHQHHe+MVDa5BoB00tAWgIR0CSYBTakAPvdX2UKGgGR0By6b5j6N2laAdNCQFoCEdAkmB5SBK+SXV9lChoBkdAcON+ee4Cp2gHTXIBaAhHQJJhegsbvPV1fZQoaAZHQHMowVXV9WpoB00bAWgIR0CSYhAY51eTdX2UKGgGR0BwnWQ9zOopaAdNIwFoCEdAkmJP4ZdfLXV9lChoBkdAc5IS00FbFGgHTRMBaAhHQJJiu9pRGc51fZQoaAZHQHNQ9mDlHSZoB00HAWgIR0CSYsYYixFBdX2UKGgGR0BxUJMTN+spaAdL72gIR0CSYuFNL128dX2UKGgGR0BwA+hCdBjXaAdL/GgIR0CSYzE6kqMFdX2UKGgGR0BwyymoBJZoaAdNEAFoCEdAkmOHCwbEP3V9lChoBkdAb2EqT8pCr2gHTQsBaAhHQJJkqHXVbzN1fZQoaAZHQHIQQeeWfK9oB00jAWgIR0CSZNVUMoc8dX2UKGgGR0Bx3V8LKFIvaAdNBwFoCEdAkmV/0qYqonV9lChoBkdAcl4420iQk2gHS9xoCEdAkmXc4ku6E3V9lChoBkdAcf/UrTYukGgHTS8BaAhHQJJmM31jAi51fZQoaAZHQHLW+V9nbqRoB00OAWgIR0CSZqDMvAXVdX2UKGgGR0BxTIeOn2qUaAdL7mgIR0CSZqYLLIPtdX2UKGgGR0ByAfjCHh0haAdNSQFoCEdAkmdry6MBIXV9lChoBkdAcr0dKNAC4mgHS9toCEdAkmePmknCwnV9lChoBkdAcAq18b70nWgHS/xoCEdAkmjD6JqIrXV9lChoBkdAbyjxCpm29mgHTSsBaAhHQJJpXTc6/7B1fZQoaAZHQHE6SjpLVWloB00PAWgIR0CSaeXRgJC0dX2UKGgGR0BuMotrbg0kaAdNAgFoCEdAkmp2zru6VnV9lChoBkdAcRn4y44IbGgHTSQBaAhHQJJqiv4dp7F1fZQoaAZHQHGG7Ikqto1oB01DAWgIR0CSa4ESuhbodX2UKGgGR0BvVeWjXWe6aAdNTAFoCEdAkmwhvaURnXV9lChoBkdAc2PyUcGTtGgHTQsBaAhHQJJsMXN1QqJ1fZQoaAZHQHK0rNB4UvhoB0vcaAhHQJJsUyfthNN1fZQoaAZHQHAQm1twaR9oB00wAWgIR0CSgp8LKFIvdX2UKGgGR0BwH4iu+yquaAdL5GgIR0CSgqkxh2GJdX2UKGgGR0B0B9mg8KXwaAdNEgFoCEdAkoK0CV8kU3V9lChoBkdAbO/IpYs/ZGgHS/VoCEdAkoNH1SOzY3V9lChoBkdAcBdV6eGwimgHS+1oCEdAkoQst9QXRHV9lChoBkdAcJ3AuqWC3GgHTUUBaAhHQJKFHfIjnmt1fZQoaAZHQEiqK0lZ5iVoB0vKaAhHQJKFXAaef7J1fZQoaAZHQHFJbcO9WZJoB00kAWgIR0CShi/GEPDpdX2UKGgGR0BwkTlQuVX4aAdNDAFoCEdAkoeZNTLntHV9lChoBkdAcvp+RYA80WgHTUMBaAhHQJKIJgOSW7h1fZQoaAZHQG8BN47ihnJoB0v4aAhHQJKIrv0AcT91fZQoaAZHQHDWUVi4J/poB00uAWgIR0CSiToDgZTAdX2UKGgGR0BxSfrv9cbBaAdL3mgIR0CSiY0FKTStdX2UKGgGR0BzhvLRrrPdaAdNRAFoCEdAkonJamoBJnV9lChoBkdAbmtqVQhwEWgHS/toCEdAkopTSkTHsHV9lChoBkdAcT640dilSGgHTSABaAhHQJKKeyGBWgh1fZQoaAZHQHCvLojfNzNoB00LAWgIR0CSi1AkcCHRdX2UKGgGR0BywiosI3R5aAdNUAFoCEdAkovgtOEdvXV9lChoBkdAcgN9m6GxlmgHTTMBaAhHQJKL7qW1MM91fZQoaAZHQHDqCOq//NtoB01VAWgIR0CSjCB3zMA4dX2UKGgGR0BxDzT6SDAaaAdNNAFoCEdAkoz+mrKeTXV9lChoBkdAc521JlJ6IGgHTRgBaAhHQJKN38Kohpx1fZQoaAZHQHBDZ4fOlftoB0vyaAhHQJKOR1MdtEZ1fZQoaAZHQHKSQUYbbURoB01HAWgIR0CSjlGUOd5IdX2UKGgGR0Bx7Oa+evpyaAdNeQFoCEdAko+KcEvCdnV9lChoBkdAc9unjABT42gHTRsBaAhHQJKP+xfOUt91fZQoaAZHQG90PmHP/rBoB0vuaAhHQJKQD+o99tx1fZQoaAZHQG5/uG0u14RoB009AWgIR0CSkW8FY+0PdX2UKGgGR0BxjQsmOU+taAdNDAFoCEdAkpGo6wMYuXV9lChoBkdAcKETpxFRYWgHS9loCEdAkpHRDohY/3V9lChoBkdAUf62c8TzumgHS6BoCEdAkpJEtmL9/HV9lChoBkdAc1EI065oXmgHS+RoCEdAkpJK8QI2O3V9lChoBkdAb4oK9f1Hv2gHTSIBaAhHQJKSWW9lEql1fZQoaAZHQHLOMuFpPARoB01RAWgIR0CSkm9g4OtodX2UKGgGR0BzIVHYpUgkaAdNUQFoCEdAkpLm6PKdQXV9lChoBkdAbk6cxTKkmGgHTRoBaAhHQJKTUNayKN11fZQoaAZHQHOAiCaqjrRoB00+AWgIR0CSk6ixmkFfdX2UKGgGR0ByU1+I/JNkaAdNPQFoCEdAkpVi7oSteXV9lChoBkdAbrVAMUh3aGgHTR0BaAhHQJKV0+IMz/J1fZQoaAZHQHH76Lfk3jxoB0viaAhHQJKV+a7VawF1fZQoaAZHQHF9OBg/keZoB00vAWgIR0CSll7fHggpdX2UKGgGR0BzS0qiGnGbaAdNCAFoCEdAkpaBl6JIlXV9lChoBkdAcidwIdELIGgHS+doCEdAkpd2i5/b03V9lChoBkdAcZLF3pwCKmgHS91oCEdAkpgcy31BdHV9lChoBkdAbteuAZsKs2gHS+BoCEdAkphkahpQDXV9lChoBkdAc1Uhhpg1FmgHTRsBaAhHQJKZZ7F85S51fZQoaAZHQHFeOp84PwxoB0vtaAhHQJKZ8KlYU351fZQoaAZHQHDS98E3bVVoB00MAWgIR0CSmk8lXzUadX2UKGgGR0Bt0MC5mRNiaAdNPgFoCEdAkppPDP4VRHV9lChoBkdAc6oEbHZK4GgHTSQBaAhHQJKaVOj7AL11fZQoaAZHQHMWSnpB5X5oB01AAWgIR0CSmwIVdonKdX2UKGgGR0BvmC3iJfpmaAdNEAFoCEdAkptXv+fh/HV9lChoBkdAcGoiQ1aW5mgHTcUBaAhHQJKcUvAXVLB1fZQoaAZHQHA/XjyWiURoB00FAWgIR0CSnT0o0ALidX2UKGgGR0BuJ6NCJGe+aAdNBQFoCEdAkp1jFQ2uPnV9lChoBkdAcKZjNIK+jGgHS9VoCEdAkp2LvG6wuHV9lChoBkdAcQA6rvLHMmgHS/9oCEdAkp2/EbYK6XV9lChoBkdAcXlgv114gWgHTRoBaAhHQJKeWVlf7aZ1fZQoaAZHQEJ3DPWxyGVoB0u0aAhHQJKecP9UCJZ1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.1.0+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7815ce6ac9d0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7815ce6aca60>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7815ce6acaf0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7815ce6acb80>", "_build": "<function ActorCriticPolicy._build at 0x7815ce6acc10>", "forward": "<function ActorCriticPolicy.forward at 0x7815ce6acca0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7815ce6acd30>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7815ce6acdc0>", "_predict": "<function ActorCriticPolicy._predict at 0x7815ce6ace50>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7815ce6acee0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7815ce6acf70>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7815ce6ad000>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7815ce84a440>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 10010624, "_total_timesteps": 10000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1698505574986195902, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZ6JT7huvQ9Sp0av1+V374hd8o96kLIvgAAAAAAAAAAGo2hPb7/sj+1D9k+Nl18vr4z9j1Ceos+AAAAAAAAAAAzr4u7SPuIuoOqmzUz2JAv+RRGOk6csbQAAIA/AACAP82UNj177JW6/Q0yvQxYLDMCmjK7qz1PswAAgD8AAIA/cxnwPQfmrz9FiOU+1ULBvkDtaD5Tgp8+AAAAAAAAAAAzHds9tBPAP6aiIz/BV6A9/4SIPd4JvD4AAAAAAAAAAM14sDwUrpu43YLAs/4ygq7qJ9W7y3utMwAAgD8AAIA/AFg9O9dBFrs9c+g7SfSRPDWMErwz7Hs9AACAPwAAgD864D8++1pOP5/SNj7NVyG/Hc3uPq4liz0AAAAAAAAAAJqH0b3kQSY/MB+7vV2KV78+i4e+4gFvvAAAAAAAAAAAZra8vMqJrj9uWOO+u8byvkodCzz2HSW9AAAAAAAAAABmvF8+tVWGP+pdFT6/+TS/8sX4PnxwBD0AAAAAAAAAAM1TVz04jM896sGevsmtsr4NmJ29JTNVvgAAAAAAAAAAQNWmPaQdET5OBm++5IPJvoW0r7yGXjK+AAAAAAAAAAAAy4M8rjWEusgKZzMFZ5Wv2UN5uqs7wbMAAIA/AACAPwCjxLwrnoA9FBU1PnE52b66VFk97rjNPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0010623999999999079, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHKqO32EkB2MAWyUS7mMAXSUR0DBD4EOwxFidX2UKGgGR0BxsX0J4SpSaAdLnWgIR0DBD4Cx/ustdX2UKGgGR0BzeN+6RQrMaAdLnGgIR0DBD4kSCe3AdX2UKGgGR0Bv891B+nZTaAdLnGgIR0DBD6Ki22G7dX2UKGgGR0Bz91p35eqraAdLq2gIR0DBEgnuy/sWdX2UKGgGR0BvrN1r6+FlaAdLnWgIR0DBEgtEd/8VdX2UKGgGR0Bzg9RDTjNqaAdLvWgIR0DBEhYkcCHRdX2UKGgGR0BySV9c8kleaAdLuWgIR0DBEh1lK9PDdX2UKGgGR0ByZGUqx1PnaAdLrmgIR0DBEicgjhUBdX2UKGgGR0ByzxLBbfP5aAdLlGgIR0DBEikBKcurdX2UKGgGR0ByjRkf9xZMaAdLnGgIR0DBEjWx4Y78dX2UKGgGR0BzccLw4KhMaAdL3WgIR0DBEjypJf6XdX2UKGgGR0BvjbUy57PZaAdLqWgIR0DBEkSIpH7QdX2UKGgGR0Bw++gYgq3FaAdLoWgIR0DBEklxS5y3dX2UKGgGR0By2MKiO/+LaAdLmmgIR0DBElKtozvadX2UKGgGR0BzGif4AS39aAdL62gIR0DBElZHqeK9dX2UKGgGR0Byj+GdqcmTaAdLrWgIR0DBEmJT2nKodX2UKGgGR0BwthEXtShraAdLs2gIR0DBEmMDwH7hdX2UKGgGR0BxBCY0EX+EaAdLrWgIR0DBEm3RCx/vdX2UKGgGR0Bx8OphnanKaAdLlGgIR0DBEn1vES/TdX2UKGgGR0BvsCWNWEK3aAdLpmgIR0DBEpgFV1fWdX2UKGgGR0ByMdbPhQ3xaAdLl2gIR0DBEq3RTjvNdX2UKGgGR0Byw8+HJtBOaAdLqmgIR0DBEr8YGdI5dX2UKGgGR0Bz94c0cfeUaAdL0GgIR0DBEsEOf/WEdX2UKGgGR0ByUc7V8Ti9aAdLvGgIR0DBEsRSpBHDdX2UKGgGR0Bzg+EpRXOoaAdLyWgIR0DBEsfcN6PbdX2UKGgGR0Bx7YWac7QtaAdLr2gIR0DBEtwTqSowdX2UKGgGR0BzdjfqHGjsaAdLwmgIR0DBEuV3IMjNdX2UKGgGR0Bx6a/zreImaAdLm2gIR0DBEvLIq9XcdX2UKGgGR0Bx/Zs54nndaAdLsmgIR0DBEvVjPOY6dX2UKGgGR0Byfn0Cih38aAdLvmgIR0DBEvc0YTCcdX2UKGgGR0ByQTonrpqzaAdLvmgIR0DBEwPq/ub7dX2UKGgGR0Bzi8okRjBmaAdL3WgIR0DBEw7hR64UdX2UKGgGR0BxEU66reZYaAdLwWgIR0DBExSCFsYVdX2UKGgGR0BzYD1AZ88caAdLumgIR0DBExqbvw3HdX2UKGgGR0BywR62OQyRaAdLsGgIR0DBEyHFYMfBdX2UKGgGR0BwfzfvWpZPaAdLoWgIR0DBEyw9Pk7wdX2UKGgGR0BxrKACnxaxaAdLkmgIR0DBEzI3HaN/dX2UKGgGR0BxWKXZ5AyEaAdLp2gIR0DBE1TpaA4GdX2UKGgGR0Bv27tw71ZlaAdLoGgIR0DBE1c30f5ldX2UKGgGR0BzdyWv8qFzaAdLvWgIR0DBE2v/vOQhdX2UKGgGR0Bz31gUlAu7aAdLvGgIR0DBE254rz5HdX2UKGgGR0Bycctcv/R3aAdLi2gIR0DBE3OLNwBHdX2UKGgGR0ByBP1J17pnaAdLl2gIR0DBE4C17Y03dX2UKGgGR0Bxzx7+kxh2aAdLr2gIR0DBE4VipeeGdX2UKGgGR0ByPfQTmGM5aAdLwWgIR0DBE4yDPGADdX2UKGgGR0BycVe1KGtZaAdLl2gIR0DBE451ie/YdX2UKGgGR0BzzcmVqveQaAdLwmgIR0DBE6P/giu/dX2UKGgGR0Bx5c1tO2y+aAdLo2gIR0DBE7BDu0CzdX2UKGgGR0BxkDLDAJswaAdLtmgIR0DBE7uD3/PxdX2UKGgGR0ByrAfRu0kXaAdLm2gIR0DBE7xrxiG4dX2UKGgGR0ByHHHdXT3JaAdLwGgIR0DBE782aUiZdX2UKGgGR0ByJLkU9IPLaAdLsGgIR0DBE8RMN+b3dX2UKGgGR0BzcGg3974SaAdLrmgIR0DBE9N/x2B8dX2UKGgGR0BxrJCY1He8aAdLp2gIR0DBE++CK77LdX2UKGgGR0Byy2RaHKwIaAdLl2gIR0DBE/jzwtrcdX2UKGgGR0Bz/ZiZv1lHaAdLuGgIR0DBFAF7dBSldX2UKGgGR0BwopqTKT0QaAdLlWgIR0DBFA1MfzSUdX2UKGgGR0ByAM8IRh+faAdLs2gIR0DBFBPJYDDCdX2UKGgGR0By58EJSiudaAdLvGgIR0DBFBQ3gk1NdX2UKGgGR0Bxt/iCJ40NaAdLrmgIR0DBFBk4aP0adX2UKGgGR0BvVEvh60IDaAdLpGgIR0DBFBqeRPoFdX2UKGgGR0BwQ+4oZydXaAdLnGgIR0DBFDLEcbR4dX2UKGgGR0ByOWDK5kLAaAdLmWgIR0DBFDM1qFh5dX2UKGgGR0BzI1rcj7hvaAdLv2gIR0DBFDkhV2iddX2UKGgGR0B0QXpu/DceaAdL4GgIR0DBFD53Roh7dX2UKGgGR0By9Pk/8l5XaAdLsmgIR0DBFEC7K7qZdX2UKGgGR0Bxip4W1twaaAdLmWgIR0DBFEEK7ZnMdX2UKGgGR0BzOv3Cbc46aAdLw2gIR0DBFEMrmQr+dX2UKGgGR0BxVjp5eJHiaAdLnWgIR0DBFFN3+uNhdX2UKGgGR0Bzaj9kz41xaAdL0WgIR0DBFFXUYsNEdX2UKGgGR0BwenogV45caAdLj2gIR0DBFFa3XqZ/dX2UKGgGR0BvEVDc/MW5aAdLnWgIR0DBFFmZPVNIdX2UKGgGR0BRYU7bL2YfaAdLVGgIR0DBFGGJxeb/dX2UKGgGR0Bvdug3974SaAdLpmgIR0DBFGpftx+8dX2UKGgGR0BwMcaWHDaXaAdLqWgIR0DBFHJ17pmmdX2UKGgGR0ByhWbd8Aq/aAdLvWgIR0DBFH3zxwyZdX2UKGgGR0AlrEfDDTBqaAdLTGgIR0DBFIBCpm29dX2UKGgGR0ByXPPszEaVaAdLwWgIR0DBFIa5sj3VdX2UKGgGR0BzYop8WsRyaAdLymgIR0DBFI5g/keZdX2UKGgGR0Bzhtguyu6maAdLqWgIR0DBFKMGxD9gdX2UKGgGR0ByUCyTpxFRaAdLv2gIR0DBFKL0z0pWdX2UKGgGR0ByOVzCDVYqaAdLwmgIR0DBFKpvLowFdX2UKGgGR0ByDs4HX2/SaAdLumgIR0DBFK/6O5rhdX2UKGgGR0Bx77NnoPkJaAdLxWgIR0DBFLTG1hLHdX2UKGgGR0Byh6dYnv2HaAdLrmgIR0DBFLv3BYV7dX2UKGgGR0Bxc5vtMPBjaAdLrmgIR0DBFL9IuoP1dX2UKGgGR0Busiynk1dgaAdLnWgIR0DBFME56t1ZdX2UKGgGR0ByK/g4wRGuaAdLv2gIR0DBFMvbItDldX2UKGgGR0BxF/VAiV0LaAdLpGgIR0DBFNc+5e7ddX2UKGgGR0ByRxChN/OMaAdLh2gIR0DBFNlMPBi1dX2UKGgGR0B0Loo5PuXvaAdLwGgIR0DBFN+BOHnEdX2UKGgGR0By2AUAT7EYaAdLn2gIR0DBFOJ86V+rdX2UKGgGR0BzLwyfthNNaAdLwWgIR0DBFPT1EmY0dX2UKGgGR0Bz2U6nzg/DaAdLrWgIR0DBFPeOp84QdX2UKGgGR0BvKDwrlNlAaAdLl2gIR0DBFP5g3LmqdX2UKGgGR0Byg8tQKrq/aAdNVgFoCEdAwRULjghr33V9lChoBkdActGicG1QZWgHS5toCEdAwRUP1uBMBnV9lChoBkdAcg5Uoa1kUmgHS7JoCEdAwRUQ4ffXPXV9lChoBkdAcPVwe/5+IGgHS59oCEdAwRUWmjTKDHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 2692, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.1.0+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 259.7505985760466, "std_reward": 12.456677554269561, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-10-28T14:58:08.315476"}
 
1
+ {"mean_reward": 302.84871481441974, "std_reward": 14.520752642652598, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-10-28T16:59:05.465546"}