Wim Straetemans
commited on
Commit
·
9869e17
1
Parent(s):
e938d9f
Initial commit
Browse files- README.md +1 -1
- a2c-PandaReachDense-v2.zip +2 -2
- a2c-PandaReachDense-v2/data +18 -18
- a2c-PandaReachDense-v2/policy.optimizer.pth +1 -1
- a2c-PandaReachDense-v2/policy.pth +1 -1
- config.json +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
- vec_normalize.pkl +1 -1
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: PandaReachDense-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value: -
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: PandaReachDense-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: -1.11 +/- 0.53
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
a2c-PandaReachDense-v2.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb6ebe4dc659a28e48eb1136fb2378c0332c5590644185d3621923775437ab1a
|
3 |
+
size 109106
|
a2c-PandaReachDense-v2/data
CHANGED
@@ -4,9 +4,9 @@
|
|
4 |
":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function MultiInputActorCriticPolicy.__init__ at
|
8 |
"__abstractmethods__": "frozenset()",
|
9 |
-
"_abc_impl": "<_abc_data object at
|
10 |
},
|
11 |
"verbose": 1,
|
12 |
"policy_kwargs": {
|
@@ -40,13 +40,13 @@
|
|
40 |
"bounded_above": "[ True True True]",
|
41 |
"_np_random": null
|
42 |
},
|
43 |
-
"n_envs":
|
44 |
-
"num_timesteps":
|
45 |
-
"_total_timesteps":
|
46 |
"_num_timesteps_at_start": 0,
|
47 |
"seed": null,
|
48 |
"action_noise": null,
|
49 |
-
"start_time":
|
50 |
"learning_rate": 0.0007,
|
51 |
"tensorboard_log": null,
|
52 |
"lr_schedule": {
|
@@ -55,35 +55,35 @@
|
|
55 |
},
|
56 |
"_last_obs": {
|
57 |
":type:": "<class 'collections.OrderedDict'>",
|
58 |
-
":serialized:": "
|
59 |
-
"achieved_goal": "[[ 0.
|
60 |
-
"desired_goal": "[[
|
61 |
-
"observation": "[[
|
62 |
},
|
63 |
"_last_episode_starts": {
|
64 |
":type:": "<class 'numpy.ndarray'>",
|
65 |
-
":serialized:": "
|
66 |
},
|
67 |
"_last_original_obs": {
|
68 |
":type:": "<class 'collections.OrderedDict'>",
|
69 |
-
":serialized:": "
|
70 |
-
"achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
|
71 |
-
"desired_goal": "[[ 0.
|
72 |
-
"observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
|
73 |
},
|
74 |
"_episode_num": 0,
|
75 |
"use_sde": false,
|
76 |
"sde_sample_freq": -1,
|
77 |
-
"_current_progress_remaining":
|
78 |
"ep_info_buffer": {
|
79 |
":type:": "<class 'collections.deque'>",
|
80 |
-
":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////
|
81 |
},
|
82 |
"ep_success_buffer": {
|
83 |
":type:": "<class 'collections.deque'>",
|
84 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
85 |
},
|
86 |
-
"_n_updates":
|
87 |
"n_steps": 5,
|
88 |
"gamma": 0.99,
|
89 |
"gae_lambda": 1.0,
|
|
|
4 |
":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7f1f3bea5430>",
|
8 |
"__abstractmethods__": "frozenset()",
|
9 |
+
"_abc_impl": "<_abc_data object at 0x7f1f3be9ea80>"
|
10 |
},
|
11 |
"verbose": 1,
|
12 |
"policy_kwargs": {
|
|
|
40 |
"bounded_above": "[ True True True]",
|
41 |
"_np_random": null
|
42 |
},
|
43 |
+
"n_envs": 6,
|
44 |
+
"num_timesteps": 500010,
|
45 |
+
"_total_timesteps": 500000,
|
46 |
"_num_timesteps_at_start": 0,
|
47 |
"seed": null,
|
48 |
"action_noise": null,
|
49 |
+
"start_time": 1674231992111677191,
|
50 |
"learning_rate": 0.0007,
|
51 |
"tensorboard_log": null,
|
52 |
"lr_schedule": {
|
|
|
55 |
},
|
56 |
"_last_obs": {
|
57 |
":type:": "<class 'collections.OrderedDict'>",
|
58 |
+
":serialized:": "gAWVGwIAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolkgAAAAAAAAAhdFXP+Csjz+wtJK/wUQfPsUpLT/jLbq+MkJfv2G3gb934Hm/WnpHP7xfhb/BibQ+IAF3vy88Kz74h3g+n287P1Bvxb9dfjY+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksGSwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcolkgAAAAAAAAAg92EPztUhj8PB5G/zuAGPgPfGz8XjIu+O/tzv/5Nd7/wO5S/W/+FP9wsd7/o4uI+FQGnvzmH9j0LnMA+ezKAP9o/vL9/rzY+lGgOSwZLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWkAAAAAAAAACF0Vc/4KyPP7C0kr9F2Z897punvXdQ6DzBRB8+xSktP+Mtur4WFCq81wQIPF2jiDoyQl+/YbeBv3fgeb/wpKc8ZMbQPANpaL1aekc/vF+Fv8GJtD4BNXy91CMqvlq9Yb0gAXe/LzwrPviHeD7+qjY99MUBvrYQ8bufbzs/UG/Fv11+Nj42wqo9mTwIvXlvoTyUaA5LBksGhpRoEnSUUpR1Lg==",
|
59 |
+
"achieved_goal": "[[ 0.84304076 1.1224632 -1.1461391 ]\n [ 0.15553571 0.6764186 -0.36363134]\n [-0.8721038 -1.0134088 -0.9760813 ]\n [ 0.7792107 -1.0419841 0.35261348]\n [-0.9648609 0.16722177 0.24270618]\n [ 0.73217195 -1.5424595 0.17821641]]",
|
60 |
+
"desired_goal": "[[ 1.03801 1.0494455 -1.1330279 ]\n [ 0.13171694 0.60887164 -0.27255318]\n [-0.9530522 -0.9660338 -1.1580791 ]\n [ 1.0468553 -0.96552825 0.4431374 ]\n [-1.3047205 0.1203751 0.3761905 ]\n [ 1.0015405 -1.4706986 0.17840384]]",
|
61 |
+
"observation": "[[ 8.4304076e-01 1.1224632e+00 -1.1461391e+00 7.8051127e-02\n -8.1840381e-02 2.8358681e-02]\n [ 1.5553571e-01 6.7641860e-01 -3.6363134e-01 -1.0380765e-02\n 8.3019352e-03 1.0424663e-03]\n [-8.7210381e-01 -1.0134088e+00 -9.7608131e-01 2.0464391e-02\n 2.5485225e-02 -5.6740772e-02]\n [ 7.7921069e-01 -1.0419841e+00 3.5261348e-01 -6.1573986e-02\n -1.6615230e-01 -5.5112220e-02]\n [-9.6486092e-01 1.6722177e-01 2.4270618e-01 4.4596665e-02\n -1.2673169e-01 -7.3567284e-03]\n [ 7.3217195e-01 -1.5424595e+00 1.7821641e-01 8.3378240e-02\n -3.3260915e-02 1.9706475e-02]]"
|
62 |
},
|
63 |
"_last_episode_starts": {
|
64 |
":type:": "<class 'numpy.ndarray'>",
|
65 |
+
":serialized:": "gAWVeQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYGAAAAAAAAAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUjAFDlHSUUpQu"
|
66 |
},
|
67 |
"_last_original_obs": {
|
68 |
":type:": "<class 'collections.OrderedDict'>",
|
69 |
+
":serialized:": "gAWVGwIAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolkgAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksGSwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcolkgAAAAAAAAAuDPDPSABRb0/C4w+A6bjPbHtnDx1ZIc+2RWyPXoChT3zSHA+AqmovZ5hA72QZQo+vve8vHXjjb1NoJY+8LpdvYd6JD1d5RE9lGgOSwZLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWkAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBksGhpRoEnSUUpR1Lg==",
|
70 |
+
"achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
|
71 |
+
"desired_goal": "[[ 0.09531349 -0.04809678 0.2735233 ]\n [ 0.11115649 0.01915631 0.2644383 ]\n [ 0.08695573 0.06494613 0.23465328]\n [-0.08235361 -0.03207552 0.13515306]\n [-0.02306735 -0.0692815 0.29419175]\n [-0.05413336 0.04015591 0.03561913]]",
|
72 |
+
"observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
|
73 |
},
|
74 |
"_episode_num": 0,
|
75 |
"use_sde": false,
|
76 |
"sde_sample_freq": -1,
|
77 |
+
"_current_progress_remaining": -1.999999999990898e-05,
|
78 |
"ep_info_buffer": {
|
79 |
":type:": "<class 'collections.deque'>",
|
80 |
+
":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIkPmAQGdS7L+UhpRSlIwBbJRLMowBdJRHQJHidNahYeV1fZQoaAZoCWgPQwjwF7MlqyLqv5SGlFKUaBVLMmgWR0CR4f4agmJFdX2UKGgGaAloD0MIk3L3OT7a7r+UhpRSlGgVSzJoFkdAkeGCS7oStnV9lChoBmgJaA9DCKp+pfPh2fa/lIaUUpRoFUsyaBZHQJHhCdWhh6V1fZQoaAZoCWgPQwiuLqcExKTwv5SGlFKUaBVLMmgWR0CR5pBTn7pFdX2UKGgGaAloD0MIFqJD4Egg5L+UhpRSlGgVSzJoFkdAkeXomw7kn3V9lChoBmgJaA9DCHlZEwt8xeS/lIaUUpRoFUsyaBZHQJHlZRyfcvd1fZQoaAZoCWgPQwhIiV3b263iv5SGlFKUaBVLMmgWR0CR5O35N47jdX2UKGgGaAloD0MIp+Zyg6GO8L+UhpRSlGgVSzJoFkdAkeRx8D0UXnV9lChoBmgJaA9DCK7zb5f9Ou+/lIaUUpRoFUsyaBZHQJHj+UnogV51fZQoaAZoCWgPQwjKNnAH6pTqv5SGlFKUaBVLMmgWR0CR6XgctGutdX2UKGgGaAloD0MIyvs4miMr5b+UhpRSlGgVSzJoFkdAkejQw0wai3V9lChoBmgJaA9DCM5RR8fVSOi/lIaUUpRoFUsyaBZHQJHoTWy1NQF1fZQoaAZoCWgPQwjnjCjtDb7qv5SGlFKUaBVLMmgWR0CR59ZqVQhwdX2UKGgGaAloD0MIiZgSSfQy77+UhpRSlGgVSzJoFkdAkedaYVqN63V9lChoBmgJaA9DCA1S8BRypeG/lIaUUpRoFUsyaBZHQJHm4bEP1+R1fZQoaAZoCWgPQwiHF0Skpt3tv5SGlFKUaBVLMmgWR0CR7Ey+6Ae8dX2UKGgGaAloD0MIKsWOxqF+97+UhpRSlGgVSzJoFkdAkeulSS/0unV9lChoBmgJaA9DCLt868N6I+K/lIaUUpRoFUsyaBZHQJHrIe3hGYt1fZQoaAZoCWgPQwg7N23GaUj1v5SGlFKUaBVLMmgWR0CR6qrRBu4xdX2UKGgGaAloD0MI2NMOf03W7L+UhpRSlGgVSzJoFkdAkeouueSSvHV9lChoBmgJaA9DCEiKyLCKN92/lIaUUpRoFUsyaBZHQJHptb7j1f51fZQoaAZoCWgPQwgtlbcjnJbjv5SGlFKUaBVLMmgWR0CR7yHRCx/vdX2UKGgGaAloD0MI0Vs8vOdA6b+UhpRSlGgVSzJoFkdAke56Cg9Ne3V9lChoBmgJaA9DCJ2C/Gzk+vK/lIaUUpRoFUsyaBZHQJHt9rO7g891fZQoaAZoCWgPQwh6xOi5ha7tv5SGlFKUaBVLMmgWR0CR7X+3Ytg8dX2UKGgGaAloD0MI0/pbAvAP8r+UhpRSlGgVSzJoFkdAke0D0163RXV9lChoBmgJaA9DCFSthVloZ+m/lIaUUpRoFUsyaBZHQJHsixrzoU11fZQoaAZoCWgPQwjTZpyGqAL1v5SGlFKUaBVLMmgWR0CR8fzhP0qZdX2UKGgGaAloD0MI7NtJRPiX5b+UhpRSlGgVSzJoFkdAkfFVGb1AaHV9lChoBmgJaA9DCML4adyb3+u/lIaUUpRoFUsyaBZHQJHw0ZsKsuF1fZQoaAZoCWgPQwizs+idCrjuv5SGlFKUaBVLMmgWR0CR8FqWC2+gdX2UKGgGaAloD0MI3e9QFOgT47+UhpRSlGgVSzJoFkdAke/ei8FpwnV9lChoBmgJaA9DCOcYkL3e/ea/lIaUUpRoFUsyaBZHQJHvZgAp8Wt1fZQoaAZoCWgPQwjlCu9yEd/5v5SGlFKUaBVLMmgWR0CR9NWjXWe6dX2UKGgGaAloD0MIyJQPQdXo7L+UhpRSlGgVSzJoFkdAkfQtwNsnA3V9lChoBmgJaA9DCNffEoB/KgDAlIaUUpRoFUsyaBZHQJHzqpKjBVN1fZQoaAZoCWgPQwiUhETaxt/wv5SGlFKUaBVLMmgWR0CR8zOIqLCOdX2UKGgGaAloD0MI7C+7Jw9L+r+UhpRSlGgVSzJoFkdAkfK32h7E53V9lChoBmgJaA9DCK67eapDbvC/lIaUUpRoFUsyaBZHQJHyP2g39751fZQoaAZoCWgPQwjMmljgK7rev5SGlFKUaBVLMmgWR0CR95pRoAXEdX2UKGgGaAloD0MIUMdjBipj+r+UhpRSlGgVSzJoFkdAkfby2c8Tz3V9lChoBmgJaA9DCP+vOnKkM+2/lIaUUpRoFUsyaBZHQJH2bzXjENx1fZQoaAZoCWgPQwi4Wicux6vqv5SGlFKUaBVLMmgWR0CR9fgHu7YkdX2UKGgGaAloD0MI1V5E2zE1/L+UhpRSlGgVSzJoFkdAkfV8NYr8SHV9lChoBmgJaA9DCN0Ii4o4Hfa/lIaUUpRoFUsyaBZHQJH1A3l0YCR1fZQoaAZoCWgPQwg9DRgkfRr9v5SGlFKUaBVLMmgWR0CR+nNucc2jdX2UKGgGaAloD0MIlDMUd7xJ57+UhpRSlGgVSzJoFkdAkfnLronrp3V9lChoBmgJaA9DCC0Heqhtw+S/lIaUUpRoFUsyaBZHQJH5SDRMN+d1fZQoaAZoCWgPQwiwcJLmj2n4v5SGlFKUaBVLMmgWR0CR+NEhJRO2dX2UKGgGaAloD0MIFAX6RJ6k/L+UhpRSlGgVSzJoFkdAkfhVOfukUXV9lChoBmgJaA9DCHGPpQ9dkP+/lIaUUpRoFUsyaBZHQJH33Mpw0fp1fZQoaAZoCWgPQwgZA+s4fuj4v5SGlFKUaBVLMmgWR0CR/VWuoxYadX2UKGgGaAloD0MIG2X9ZmK68b+UhpRSlGgVSzJoFkdAkfyt9MK1HHV9lChoBmgJaA9DCGjKTj+oy/m/lIaUUpRoFUsyaBZHQJH8KtSydFx1fZQoaAZoCWgPQwg9D+7O2u30v5SGlFKUaBVLMmgWR0CR+7PSDyvtdX2UKGgGaAloD0MIPZ6WH7jK8L+UhpRSlGgVSzJoFkdAkfs3xe9i+nV9lChoBmgJaA9DCDSEY5Y9yf+/lIaUUpRoFUsyaBZHQJH6vustCiR1fZQoaAZoCWgPQwgtB3qobYP2v5SGlFKUaBVLMmgWR0CSAGF3IMjNdX2UKGgGaAloD0MIw/UoXI8C87+UhpRSlGgVSzJoFkdAkf+6ASWZ7XV9lChoBmgJaA9DCG3GaYgq/PS/lIaUUpRoFUsyaBZHQJH/NoYekpJ1fZQoaAZoCWgPQwgi41Eq4Qnxv5SGlFKUaBVLMmgWR0CR/r+2mYShdX2UKGgGaAloD0MIWYtPATCeA8CUhpRSlGgVSzJoFkdAkf5Dx5LRKHV9lChoBmgJaA9DCPNUh9wMd/K/lIaUUpRoFUsyaBZHQJH9ywX668R1fZQoaAZoCWgPQwjH155ZEqDmv5SGlFKUaBVLMmgWR0CSA1jNpudgdX2UKGgGaAloD0MITYV4JF4e97+UhpRSlGgVSzJoFkdAkgKxNIsiCHV9lChoBmgJaA9DCBah2Aqa9gXAlIaUUpRoFUsyaBZHQJICLZSNwR51fZQoaAZoCWgPQwi2ErpL4qzlv5SGlFKUaBVLMmgWR0CSAbaLXL/0dX2UKGgGaAloD0MIISI17WIa/b+UhpRSlGgVSzJoFkdAkgE6r/82rHV9lChoBmgJaA9DCAVPIVfqWfm/lIaUUpRoFUsyaBZHQJIAwkRjBmB1fZQoaAZoCWgPQwjqXif1Zen3v5SGlFKUaBVLMmgWR0CSBitZFG5MdX2UKGgGaAloD0MIfQiqRq+G97+UhpRSlGgVSzJoFkdAkgWDjrAxjHV9lChoBmgJaA9DCIZY/RGGge+/lIaUUpRoFUsyaBZHQJIFABkqc3F1fZQoaAZoCWgPQwgBTYQNT+/zv5SGlFKUaBVLMmgWR0CSBIktVaOhdX2UKGgGaAloD0MIhVs+kpJe9L+UhpRSlGgVSzJoFkdAkgQNVea8YnV9lChoBmgJaA9DCMpOP6iL1PG/lIaUUpRoFUsyaBZHQJIDlJg9eQd1fZQoaAZoCWgPQwiDhv4JLlbrv5SGlFKUaBVLMmgWR0CSCQxBE8aGdX2UKGgGaAloD0MIQRAgQ8cO7b+UhpRSlGgVSzJoFkdAkghksJ6Y3XV9lChoBmgJaA9DCJc8npYfGATAlIaUUpRoFUsyaBZHQJIH4S39aU11fZQoaAZoCWgPQwgPuRluwKf1v5SGlFKUaBVLMmgWR0CSB2qvNeMRdX2UKGgGaAloD0MIxvmbUIjA87+UhpRSlGgVSzJoFkdAkgbu67NB4XV9lChoBmgJaA9DCBvZlZaRuve/lIaUUpRoFUsyaBZHQJIGdhd+ocd1fZQoaAZoCWgPQwh7Mv/om/QFwJSGlFKUaBVLMmgWR0CSC+5xBE8adX2UKGgGaAloD0MIUDqRYKqZ67+UhpRSlGgVSzJoFkdAkgtGk8A7xXV9lChoBmgJaA9DCGAgCJChY/q/lIaUUpRoFUsyaBZHQJIKwyhzvJB1fZQoaAZoCWgPQwhOYaWCiur0v5SGlFKUaBVLMmgWR0CSCkxxT850dX2UKGgGaAloD0MIVwdA3NUr+7+UhpRSlGgVSzJoFkdAkgnQemvW6XV9lChoBmgJaA9DCAk02NR5VPC/lIaUUpRoFUsyaBZHQJIJV84Pwux1fZQoaAZoCWgPQwhEqFKzB9rlv5SGlFKUaBVLMmgWR0CSDs8h9srNdX2UKGgGaAloD0MIPBIvT+eK8b+UhpRSlGgVSzJoFkdAkg4nfZVXFXV9lChoBmgJaA9DCAckYd9OouW/lIaUUpRoFUsyaBZHQJINpA/s3Q51fZQoaAZoCWgPQwgdy7vqATP6v5SGlFKUaBVLMmgWR0CSDS0knkT6dX2UKGgGaAloD0MIObNdoQ+W3r+UhpRSlGgVSzJoFkdAkgyxCpm29nV9lChoBmgJaA9DCCbGMv0S8fq/lIaUUpRoFUsyaBZHQJIMOE12q1h1fZQoaAZoCWgPQwhJvDydK0r4v5SGlFKUaBVLMmgWR0CSEbd5IH1OdX2UKGgGaAloD0MIXalnQSgv8b+UhpRSlGgVSzJoFkdAkhEP6CUX53V9lChoBmgJaA9DCN9t3jgpjPa/lIaUUpRoFUsyaBZHQJIQjJQtSQ51fZQoaAZoCWgPQwgrpWd6iZEAwJSGlFKUaBVLMmgWR0CSEBYoy9EkdX2UKGgGaAloD0MIcsPvplu2+7+UhpRSlGgVSzJoFkdAkg+abSZ0CHV9lChoBmgJaA9DCOuLhLacCwTAlIaUUpRoFUsyaBZHQJIPIdXDFZR1ZS4="
|
81 |
},
|
82 |
"ep_success_buffer": {
|
83 |
":type:": "<class 'collections.deque'>",
|
84 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
85 |
},
|
86 |
+
"_n_updates": 16667,
|
87 |
"n_steps": 5,
|
88 |
"gamma": 0.99,
|
89 |
"gae_lambda": 1.0,
|
a2c-PandaReachDense-v2/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 44734
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fa43fd8e98a45976f3de648611109f73015469656c3e39a5c8255ddced6b21c
|
3 |
size 44734
|
a2c-PandaReachDense-v2/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 46014
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d59507284cf17c09bf73559bbeaf9688cdc63f446fb8c11267c0a276b2769179
|
3 |
size 46014
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7f785cdb1c10>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f785cdada80>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.dict.Dict'>", ":serialized:": "gAWVUgMAAAAAAACMD2d5bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwOZ3ltLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUaBCTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowGX3NoYXBllEsDhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZSMAUOUdJRSlIwEaGlnaJRoHSiWDAAAAAAAAAAAACBBAAAgQQAAIEGUaBVLA4WUaCB0lFKUjA1ib3VuZGVkX2JlbG93lGgdKJYDAAAAAAAAAAEBAZRoEowCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZRoIHSUUpSMDWJvdW5kZWRfYWJvdmWUaB0olgMAAAAAAAAAAQEBlGgsSwOFlGggdJRSlIwKX25wX3JhbmRvbZROdWKMDGRlc2lyZWRfZ29hbJRoDSmBlH2UKGgQaBVoGEsDhZRoGmgdKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZRoIHSUUpRoI2gdKJYMAAAAAAAAAAAAIEEAACBBAAAgQZRoFUsDhZRoIHSUUpRoKGgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoMmgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoN051YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgVaBhLBoWUaBpoHSiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBVLBoWUaCB0lFKUaCNoHSiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBVLBoWUaCB0lFKUaChoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDJoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDdOdWJ1aBhOaBBOaDdOdWIu", "spaces": "OrderedDict([('achieved_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('desired_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('observation', Box([-10. -10. -10. -10. -10. -10.], [10. 10. 10. 10. 10. 10.], (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaApLA4WUjAFDlHSUUpSMBGhpZ2iUaBIolgwAAAAAAAAAAACAPwAAgD8AAIA/lGgKSwOFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWAwAAAAAAAAABAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYDAAAAAAAAAAEBAZRoIUsDhZRoFXSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1674224886800561643, "learning_rate": 0.0007, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/RvAGjbi6x4WUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA2rPNPpTv9L0ITBE/2rPNPpTv9L0ITBE/2rPNPpTv9L0ITBE/2rPNPpTv9L0ITBE/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAA5+eJPiIcfL9jdK8/u4gHv+ebmT9DtYq/TocJvscekz/3oYY/FhPBP/LF/z5ljOy+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADas80+lO/0vQhMET+VSbC6VGtGu2Wovrzas80+lO/0vQhMET+VSbC6VGtGu2Wovrzas80+lO/0vQhMET+VSbC6VGtGu2Wovrzas80+lO/0vQhMET+VSbC6VGtGu2WovryUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 0.40176278 -0.11959758 0.5675664 ]\n [ 0.40176278 -0.11959758 0.5675664 ]\n [ 0.40176278 -0.11959758 0.5675664 ]\n [ 0.40176278 -0.11959758 0.5675664 ]]", "desired_goal": "[[ 0.2693474 -0.9848043 1.3707393 ]\n [-0.5294301 1.2000703 -1.0836567 ]\n [-0.13430521 1.1493767 1.0518178 ]\n [ 1.508395 0.49955708 -0.46200863]]", "observation": "[[ 0.40176278 -0.11959758 0.5675664 -0.00134497 -0.00302764 -0.02327366]\n [ 0.40176278 -0.11959758 0.5675664 -0.00134497 -0.00302764 -0.02327366]\n [ 0.40176278 -0.11959758 0.5675664 -0.00134497 -0.00302764 -0.02327366]\n [ 0.40176278 -0.11959758 0.5675664 -0.00134497 -0.00302764 -0.02327366]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAL1sSPEbu3by8htA8eVXgvbRLnb3kfyM+sIgGvtxDFb7BK8Y73pGPPH8yqD2NIVQ+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[ 0.00893287 -0.02709116 0.02545487]\n [-0.10953803 -0.07680455 0.15966755]\n [-0.1313808 -0.14576668 0.0060477 ]\n [ 0.01752561 0.08212756 0.20715924]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIjup0IOvpD8CUhpRSlIwBbJRLMowBdJRHQKJAACRwIdF1fZQoaAZoCWgPQwhWuOUjKRkSwJSGlFKUaBVLMmgWR0CiP8UfYBeYdX2UKGgGaAloD0MIYDsYsU8gBMCUhpRSlGgVSzJoFkdAoj+I7PppvnV9lChoBmgJaA9DCA/vObAcMRLAlIaUUpRoFUsyaBZHQKI/S/GEPDp1fZQoaAZoCWgPQwjNeFvptfkEwJSGlFKUaBVLMmgWR0CiQNeaz/p/dX2UKGgGaAloD0MIIGCt2jWBCMCUhpRSlGgVSzJoFkdAokCcoScslXV9lChoBmgJaA9DCGagMv59JgzAlIaUUpRoFUsyaBZHQKJAYF0xM391fZQoaAZoCWgPQwi9/iQ+d0IMwJSGlFKUaBVLMmgWR0CiQCNet0V8dX2UKGgGaAloD0MIildZ2xQPBsCUhpRSlGgVSzJoFkdAokG3wAlv63V9lChoBmgJaA9DCMdHizOG2QfAlIaUUpRoFUsyaBZHQKJBfRc/t6Z1fZQoaAZoCWgPQwhCB13CoVcHwJSGlFKUaBVLMmgWR0CiQUEEcKgJdX2UKGgGaAloD0MItAJDVrfaAsCUhpRSlGgVSzJoFkdAokEEI3R5T3V9lChoBmgJaA9DCGIRww5jkgPAlIaUUpRoFUsyaBZHQKJCkFYdQwd1fZQoaAZoCWgPQwi7DWq/tRMLwJSGlFKUaBVLMmgWR0CiQlVzZHurdX2UKGgGaAloD0MITyFX6lmwBsCUhpRSlGgVSzJoFkdAokIZS1mapnV9lChoBmgJaA9DCKInZVJDuwfAlIaUUpRoFUsyaBZHQKJB3FNL1291fZQoaAZoCWgPQwh0CvKzkYsJwJSGlFKUaBVLMmgWR0CiQ2/hVENOdX2UKGgGaAloD0MIChAFM6YgCMCUhpRSlGgVSzJoFkdAokM00rK/23V9lChoBmgJaA9DCMxFfCdmnQrAlIaUUpRoFUsyaBZHQKJC+JvYODt1fZQoaAZoCWgPQwh/hGHAkusGwJSGlFKUaBVLMmgWR0CiQruEdvKmdX2UKGgGaAloD0MIRxyygXQRCcCUhpRSlGgVSzJoFkdAokRJULlV+HV9lChoBmgJaA9DCPfMkgA1dRDAlIaUUpRoFUsyaBZHQKJEDl1bJOp1fZQoaAZoCWgPQwi9HkyKj28HwJSGlFKUaBVLMmgWR0CiQ9Iyj59FdX2UKGgGaAloD0MItksbDkvDD8CUhpRSlGgVSzJoFkdAokOVHH3lCHV9lChoBmgJaA9DCPwYc9cS4hHAlIaUUpRoFUsyaBZHQKJFH5prULF1fZQoaAZoCWgPQwh4COOncc8LwJSGlFKUaBVLMmgWR0CiROSrxRVIdX2UKGgGaAloD0MIS1rxDYUvCsCUhpRSlGgVSzJoFkdAokSohhYvFnV9lChoBmgJaA9DCFsjgnFwCQzAlIaUUpRoFUsyaBZHQKJEa3l0YCR1fZQoaAZoCWgPQwgyWdx/ZLoHwJSGlFKUaBVLMmgWR0CiRf+3hGYsdX2UKGgGaAloD0MIXd+Hg4RoC8CUhpRSlGgVSzJoFkdAokXEpCrtFHV9lChoBmgJaA9DCCLgEKrUfBHAlIaUUpRoFUsyaBZHQKJFiHerMkh1fZQoaAZoCWgPQwhBvK5fsJsOwJSGlFKUaBVLMmgWR0CiRUtVinYQdX2UKGgGaAloD0MIT7FqEOYWCcCUhpRSlGgVSzJoFkdAokbViDujRHV9lChoBmgJaA9DCK+xS1RvjQjAlIaUUpRoFUsyaBZHQKJGmoVEd/91fZQoaAZoCWgPQwjtnGaBdkcJwJSGlFKUaBVLMmgWR0CiRl49X9zfdX2UKGgGaAloD0MIBU62gTuwC8CUhpRSlGgVSzJoFkdAokYhJkGzKXV9lChoBmgJaA9DCOi9MQQAhwLAlIaUUpRoFUsyaBZHQKJHtqnm7rd1fZQoaAZoCWgPQwgiN8MN+LwLwJSGlFKUaBVLMmgWR0CiR3un/DLsdX2UKGgGaAloD0MIDFpIwOgSFMCUhpRSlGgVSzJoFkdAokc/bVSXMXV9lChoBmgJaA9DCO26tyIxAQ/AlIaUUpRoFUsyaBZHQKJHAnFYMfB1fZQoaAZoCWgPQwifAIqRJTMHwJSGlFKUaBVLMmgWR0CiSItGd7OWdX2UKGgGaAloD0MImBdgH50KEcCUhpRSlGgVSzJoFkdAokhQP9UCJXV9lChoBmgJaA9DCJeQD3o2Kw3AlIaUUpRoFUsyaBZHQKJIFB2wFC91fZQoaAZoCWgPQwifHtsy4MwFwJSGlFKUaBVLMmgWR0CiR9dU83dcdX2UKGgGaAloD0MIqDrkZrgBBMCUhpRSlGgVSzJoFkdAoklsW43FUHV9lChoBmgJaA9DCNECtK1m/QPAlIaUUpRoFUsyaBZHQKJJMVwgkkd1fZQoaAZoCWgPQwjbp+MxA3UNwJSGlFKUaBVLMmgWR0CiSPVpj+aSdX2UKGgGaAloD0MINszQeCLIB8CUhpRSlGgVSzJoFkdAoki4Si/O+3V9lChoBmgJaA9DCLr5RnTPug/AlIaUUpRoFUsyaBZHQKJKSeI2wV11fZQoaAZoCWgPQwjLTdTS3AoJwJSGlFKUaBVLMmgWR0CiSg779AHFdX2UKGgGaAloD0MI9aCgFK1cCMCUhpRSlGgVSzJoFkdAoknS/j81oHV9lChoBmgJaA9DCOik942vnRDAlIaUUpRoFUsyaBZHQKJJleFcpsp1fZQoaAZoCWgPQwhjQWFQpjEIwJSGlFKUaBVLMmgWR0CiSx3dbgTAdX2UKGgGaAloD0MIMVwdAHE3DsCUhpRSlGgVSzJoFkdAokri4nWrfnV9lChoBmgJaA9DCAx07QvoxQvAlIaUUpRoFUsyaBZHQKJKpruYx+N1fZQoaAZoCWgPQwhrRDAOLl0NwJSGlFKUaBVLMmgWR0CiSmmyX2M9dX2UKGgGaAloD0MI7NlzmZoUEcCUhpRSlGgVSzJoFkdAokv8Z5zHTHV9lChoBmgJaA9DCFgBvtu8cQ3AlIaUUpRoFUsyaBZHQKJLwVtXPqt1fZQoaAZoCWgPQwgGK061FuYTwJSGlFKUaBVLMmgWR0CiS4U96kZadX2UKGgGaAloD0MIFr1TAfd8BsCUhpRSlGgVSzJoFkdAoktIOe8PF3V9lChoBmgJaA9DCF5LyAc9OwnAlIaUUpRoFUsyaBZHQKJM2NOuaF51fZQoaAZoCWgPQwhgj4mUZlMFwJSGlFKUaBVLMmgWR0CiTJ3juKGddX2UKGgGaAloD0MIG70aoDQUDsCUhpRSlGgVSzJoFkdAokxh/Aj6e3V9lChoBmgJaA9DCIWy8PW1bgrAlIaUUpRoFUsyaBZHQKJMJOX3QD51fZQoaAZoCWgPQwjAIVSp2XMQwJSGlFKUaBVLMmgWR0CiTbntOVPfdX2UKGgGaAloD0MIBVCMLJkDB8CUhpRSlGgVSzJoFkdAok1+9WZJCnV9lChoBmgJaA9DCMvVj03yAwrAlIaUUpRoFUsyaBZHQKJNQuL74zt1fZQoaAZoCWgPQwgv+grSjEUHwJSGlFKUaBVLMmgWR0CiTQXz+WGAdX2UKGgGaAloD0MI0NGqlnSUB8CUhpRSlGgVSzJoFkdAok6VgF5fMXV9lChoBmgJaA9DCELsTKHz+gPAlIaUUpRoFUsyaBZHQKJOWpG4I8h1fZQoaAZoCWgPQwgFw7mGGZoKwJSGlFKUaBVLMmgWR0CiTh5tvXK9dX2UKGgGaAloD0MIDtqrj4deBcCUhpRSlGgVSzJoFkdAok3hdld1MnV9lChoBmgJaA9DCOkmMQisfALAlIaUUpRoFUsyaBZHQKJPbsj3VTd1fZQoaAZoCWgPQwineccpOlIDwJSGlFKUaBVLMmgWR0CiTzRGDtgKdX2UKGgGaAloD0MIKSDtf4BVAcCUhpRSlGgVSzJoFkdAok74njQzDXV9lChoBmgJaA9DCLQ8D+7OmgjAlIaUUpRoFUsyaBZHQKJOvAsTWXl1fZQoaAZoCWgPQwheDybFx4cGwJSGlFKUaBVLMmgWR0CiUEkDIRywdX2UKGgGaAloD0MIVRUaiGUzCsCUhpRSlGgVSzJoFkdAolAN/YraunV9lChoBmgJaA9DCDSD+MCO/wjAlIaUUpRoFUsyaBZHQKJP0fdyksV1fZQoaAZoCWgPQwj75ZMVw7UPwJSGlFKUaBVLMmgWR0CiT5TuOS4fdX2UKGgGaAloD0MI2jujrUoCC8CUhpRSlGgVSzJoFkdAolEob4rSVnV9lChoBmgJaA9DCHptNlZiHgjAlIaUUpRoFUsyaBZHQKJQ7VrhzeZ1fZQoaAZoCWgPQwgmcyzvqmcGwJSGlFKUaBVLMmgWR0CiULFw97ngdX2UKGgGaAloD0MIbsST3cwoEMCUhpRSlGgVSzJoFkdAolB0UbkwOHV9lChoBmgJaA9DCF9CBYcXxAfAlIaUUpRoFUsyaBZHQKJSCIInjQ11fZQoaAZoCWgPQwhM4qyImmgKwJSGlFKUaBVLMmgWR0CiUc145cTrdX2UKGgGaAloD0MITkcAN4v3BcCUhpRSlGgVSzJoFkdAolGRRTCLuXV9lChoBmgJaA9DCArcupunegbAlIaUUpRoFUsyaBZHQKJRVDTBqKx1fZQoaAZoCWgPQwjy6bEtA84JwJSGlFKUaBVLMmgWR0CiUurhrFfidX2UKGgGaAloD0MIsFbtmpBGEMCUhpRSlGgVSzJoFkdAolKv1WbPQnV9lChoBmgJaA9DCDbLZaNzvg/AlIaUUpRoFUsyaBZHQKJSc5OrQw91fZQoaAZoCWgPQwj9wcBz76EFwJSGlFKUaBVLMmgWR0CiUjbNr0rcdX2UKGgGaAloD0MIPE1mvK1UCcCUhpRSlGgVSzJoFkdAolPY9C/oJXV9lChoBmgJaA9DCFsomZza2f+/lIaUUpRoFUsyaBZHQKJTng5zYEp1fZQoaAZoCWgPQwh79fHQd5cHwJSGlFKUaBVLMmgWR0CiU2HkT6BRdX2UKGgGaAloD0MIvYv34/YLCcCUhpRSlGgVSzJoFkdAolMkyP+4snV9lChoBmgJaA9DCHsTQ3IyMQbAlIaUUpRoFUsyaBZHQKJUrSeiBXl1fZQoaAZoCWgPQwhIp658licIwJSGlFKUaBVLMmgWR0CiVHIQWepXdX2UKGgGaAloD0MIuAIK9fRRBsCUhpRSlGgVSzJoFkdAolQ11KXfInV9lChoBmgJaA9DCOz5muWysQnAlIaUUpRoFUsyaBZHQKJT+LmZE2J1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 50000, "n_steps": 5, "gamma": 0.99, "gae_lambda": 1.0, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.29 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.8.10", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7f1f3bea5430>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f1f3be9ea80>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.dict.Dict'>", ":serialized:": "gAWVUgMAAAAAAACMD2d5bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwOZ3ltLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUaBCTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowGX3NoYXBllEsDhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZSMAUOUdJRSlIwEaGlnaJRoHSiWDAAAAAAAAAAAACBBAAAgQQAAIEGUaBVLA4WUaCB0lFKUjA1ib3VuZGVkX2JlbG93lGgdKJYDAAAAAAAAAAEBAZRoEowCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZRoIHSUUpSMDWJvdW5kZWRfYWJvdmWUaB0olgMAAAAAAAAAAQEBlGgsSwOFlGggdJRSlIwKX25wX3JhbmRvbZROdWKMDGRlc2lyZWRfZ29hbJRoDSmBlH2UKGgQaBVoGEsDhZRoGmgdKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZRoIHSUUpRoI2gdKJYMAAAAAAAAAAAAIEEAACBBAAAgQZRoFUsDhZRoIHSUUpRoKGgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoMmgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoN051YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgVaBhLBoWUaBpoHSiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBVLBoWUaCB0lFKUaCNoHSiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBVLBoWUaCB0lFKUaChoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDJoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDdOdWJ1aBhOaBBOaDdOdWIu", "spaces": "OrderedDict([('achieved_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('desired_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('observation', Box([-10. -10. -10. -10. -10. -10.], [10. 10. 10. 10. 10. 10.], (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaApLA4WUjAFDlHSUUpSMBGhpZ2iUaBIolgwAAAAAAAAAAACAPwAAgD8AAIA/lGgKSwOFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWAwAAAAAAAAABAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYDAAAAAAAAAAEBAZRoIUsDhZRoFXSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_np_random": null}, "n_envs": 6, "num_timesteps": 500010, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1674231992111677191, "learning_rate": 0.0007, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/RvAGjbi6x4WUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVGwIAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolkgAAAAAAAAAhdFXP+Csjz+wtJK/wUQfPsUpLT/jLbq+MkJfv2G3gb934Hm/WnpHP7xfhb/BibQ+IAF3vy88Kz74h3g+n287P1Bvxb9dfjY+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksGSwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcolkgAAAAAAAAAg92EPztUhj8PB5G/zuAGPgPfGz8XjIu+O/tzv/5Nd7/wO5S/W/+FP9wsd7/o4uI+FQGnvzmH9j0LnMA+ezKAP9o/vL9/rzY+lGgOSwZLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWkAAAAAAAAACF0Vc/4KyPP7C0kr9F2Z897punvXdQ6DzBRB8+xSktP+Mtur4WFCq81wQIPF2jiDoyQl+/YbeBv3fgeb/wpKc8ZMbQPANpaL1aekc/vF+Fv8GJtD4BNXy91CMqvlq9Yb0gAXe/LzwrPviHeD7+qjY99MUBvrYQ8bufbzs/UG/Fv11+Nj42wqo9mTwIvXlvoTyUaA5LBksGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 0.84304076 1.1224632 -1.1461391 ]\n [ 0.15553571 0.6764186 -0.36363134]\n [-0.8721038 -1.0134088 -0.9760813 ]\n [ 0.7792107 -1.0419841 0.35261348]\n [-0.9648609 0.16722177 0.24270618]\n [ 0.73217195 -1.5424595 0.17821641]]", "desired_goal": "[[ 1.03801 1.0494455 -1.1330279 ]\n [ 0.13171694 0.60887164 -0.27255318]\n [-0.9530522 -0.9660338 -1.1580791 ]\n [ 1.0468553 -0.96552825 0.4431374 ]\n [-1.3047205 0.1203751 0.3761905 ]\n [ 1.0015405 -1.4706986 0.17840384]]", "observation": "[[ 8.4304076e-01 1.1224632e+00 -1.1461391e+00 7.8051127e-02\n -8.1840381e-02 2.8358681e-02]\n [ 1.5553571e-01 6.7641860e-01 -3.6363134e-01 -1.0380765e-02\n 8.3019352e-03 1.0424663e-03]\n [-8.7210381e-01 -1.0134088e+00 -9.7608131e-01 2.0464391e-02\n 2.5485225e-02 -5.6740772e-02]\n [ 7.7921069e-01 -1.0419841e+00 3.5261348e-01 -6.1573986e-02\n -1.6615230e-01 -5.5112220e-02]\n [-9.6486092e-01 1.6722177e-01 2.4270618e-01 4.4596665e-02\n -1.2673169e-01 -7.3567284e-03]\n [ 7.3217195e-01 -1.5424595e+00 1.7821641e-01 8.3378240e-02\n -3.3260915e-02 1.9706475e-02]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVeQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYGAAAAAAAAAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUjAFDlHSUUpQu"}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVGwIAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolkgAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksGSwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcolkgAAAAAAAAAuDPDPSABRb0/C4w+A6bjPbHtnDx1ZIc+2RWyPXoChT3zSHA+AqmovZ5hA72QZQo+vve8vHXjjb1NoJY+8LpdvYd6JD1d5RE9lGgOSwZLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWkAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBksGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[ 0.09531349 -0.04809678 0.2735233 ]\n [ 0.11115649 0.01915631 0.2644383 ]\n [ 0.08695573 0.06494613 0.23465328]\n [-0.08235361 -0.03207552 0.13515306]\n [-0.02306735 -0.0692815 0.29419175]\n [-0.05413336 0.04015591 0.03561913]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -1.999999999990898e-05, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIkPmAQGdS7L+UhpRSlIwBbJRLMowBdJRHQJHidNahYeV1fZQoaAZoCWgPQwjwF7MlqyLqv5SGlFKUaBVLMmgWR0CR4f4agmJFdX2UKGgGaAloD0MIk3L3OT7a7r+UhpRSlGgVSzJoFkdAkeGCS7oStnV9lChoBmgJaA9DCKp+pfPh2fa/lIaUUpRoFUsyaBZHQJHhCdWhh6V1fZQoaAZoCWgPQwiuLqcExKTwv5SGlFKUaBVLMmgWR0CR5pBTn7pFdX2UKGgGaAloD0MIFqJD4Egg5L+UhpRSlGgVSzJoFkdAkeXomw7kn3V9lChoBmgJaA9DCHlZEwt8xeS/lIaUUpRoFUsyaBZHQJHlZRyfcvd1fZQoaAZoCWgPQwhIiV3b263iv5SGlFKUaBVLMmgWR0CR5O35N47jdX2UKGgGaAloD0MIp+Zyg6GO8L+UhpRSlGgVSzJoFkdAkeRx8D0UXnV9lChoBmgJaA9DCK7zb5f9Ou+/lIaUUpRoFUsyaBZHQJHj+UnogV51fZQoaAZoCWgPQwjKNnAH6pTqv5SGlFKUaBVLMmgWR0CR6XgctGutdX2UKGgGaAloD0MIyvs4miMr5b+UhpRSlGgVSzJoFkdAkejQw0wai3V9lChoBmgJaA9DCM5RR8fVSOi/lIaUUpRoFUsyaBZHQJHoTWy1NQF1fZQoaAZoCWgPQwjnjCjtDb7qv5SGlFKUaBVLMmgWR0CR59ZqVQhwdX2UKGgGaAloD0MIiZgSSfQy77+UhpRSlGgVSzJoFkdAkedaYVqN63V9lChoBmgJaA9DCA1S8BRypeG/lIaUUpRoFUsyaBZHQJHm4bEP1+R1fZQoaAZoCWgPQwiHF0Skpt3tv5SGlFKUaBVLMmgWR0CR7Ey+6Ae8dX2UKGgGaAloD0MIKsWOxqF+97+UhpRSlGgVSzJoFkdAkeulSS/0unV9lChoBmgJaA9DCLt868N6I+K/lIaUUpRoFUsyaBZHQJHrIe3hGYt1fZQoaAZoCWgPQwg7N23GaUj1v5SGlFKUaBVLMmgWR0CR6qrRBu4xdX2UKGgGaAloD0MI2NMOf03W7L+UhpRSlGgVSzJoFkdAkeouueSSvHV9lChoBmgJaA9DCEiKyLCKN92/lIaUUpRoFUsyaBZHQJHptb7j1f51fZQoaAZoCWgPQwgtlbcjnJbjv5SGlFKUaBVLMmgWR0CR7yHRCx/vdX2UKGgGaAloD0MI0Vs8vOdA6b+UhpRSlGgVSzJoFkdAke56Cg9Ne3V9lChoBmgJaA9DCJ2C/Gzk+vK/lIaUUpRoFUsyaBZHQJHt9rO7g891fZQoaAZoCWgPQwh6xOi5ha7tv5SGlFKUaBVLMmgWR0CR7X+3Ytg8dX2UKGgGaAloD0MI0/pbAvAP8r+UhpRSlGgVSzJoFkdAke0D0163RXV9lChoBmgJaA9DCFSthVloZ+m/lIaUUpRoFUsyaBZHQJHsixrzoU11fZQoaAZoCWgPQwjTZpyGqAL1v5SGlFKUaBVLMmgWR0CR8fzhP0qZdX2UKGgGaAloD0MI7NtJRPiX5b+UhpRSlGgVSzJoFkdAkfFVGb1AaHV9lChoBmgJaA9DCML4adyb3+u/lIaUUpRoFUsyaBZHQJHw0ZsKsuF1fZQoaAZoCWgPQwizs+idCrjuv5SGlFKUaBVLMmgWR0CR8FqWC2+gdX2UKGgGaAloD0MI3e9QFOgT47+UhpRSlGgVSzJoFkdAke/ei8FpwnV9lChoBmgJaA9DCOcYkL3e/ea/lIaUUpRoFUsyaBZHQJHvZgAp8Wt1fZQoaAZoCWgPQwjlCu9yEd/5v5SGlFKUaBVLMmgWR0CR9NWjXWe6dX2UKGgGaAloD0MIyJQPQdXo7L+UhpRSlGgVSzJoFkdAkfQtwNsnA3V9lChoBmgJaA9DCNffEoB/KgDAlIaUUpRoFUsyaBZHQJHzqpKjBVN1fZQoaAZoCWgPQwiUhETaxt/wv5SGlFKUaBVLMmgWR0CR8zOIqLCOdX2UKGgGaAloD0MI7C+7Jw9L+r+UhpRSlGgVSzJoFkdAkfK32h7E53V9lChoBmgJaA9DCK67eapDbvC/lIaUUpRoFUsyaBZHQJHyP2g39751fZQoaAZoCWgPQwjMmljgK7rev5SGlFKUaBVLMmgWR0CR95pRoAXEdX2UKGgGaAloD0MIUMdjBipj+r+UhpRSlGgVSzJoFkdAkfby2c8Tz3V9lChoBmgJaA9DCP+vOnKkM+2/lIaUUpRoFUsyaBZHQJH2bzXjENx1fZQoaAZoCWgPQwi4Wicux6vqv5SGlFKUaBVLMmgWR0CR9fgHu7YkdX2UKGgGaAloD0MI1V5E2zE1/L+UhpRSlGgVSzJoFkdAkfV8NYr8SHV9lChoBmgJaA9DCN0Ii4o4Hfa/lIaUUpRoFUsyaBZHQJH1A3l0YCR1fZQoaAZoCWgPQwg9DRgkfRr9v5SGlFKUaBVLMmgWR0CR+nNucc2jdX2UKGgGaAloD0MIlDMUd7xJ57+UhpRSlGgVSzJoFkdAkfnLronrp3V9lChoBmgJaA9DCC0Heqhtw+S/lIaUUpRoFUsyaBZHQJH5SDRMN+d1fZQoaAZoCWgPQwiwcJLmj2n4v5SGlFKUaBVLMmgWR0CR+NEhJRO2dX2UKGgGaAloD0MIFAX6RJ6k/L+UhpRSlGgVSzJoFkdAkfhVOfukUXV9lChoBmgJaA9DCHGPpQ9dkP+/lIaUUpRoFUsyaBZHQJH33Mpw0fp1fZQoaAZoCWgPQwgZA+s4fuj4v5SGlFKUaBVLMmgWR0CR/VWuoxYadX2UKGgGaAloD0MIG2X9ZmK68b+UhpRSlGgVSzJoFkdAkfyt9MK1HHV9lChoBmgJaA9DCGjKTj+oy/m/lIaUUpRoFUsyaBZHQJH8KtSydFx1fZQoaAZoCWgPQwg9D+7O2u30v5SGlFKUaBVLMmgWR0CR+7PSDyvtdX2UKGgGaAloD0MIPZ6WH7jK8L+UhpRSlGgVSzJoFkdAkfs3xe9i+nV9lChoBmgJaA9DCDSEY5Y9yf+/lIaUUpRoFUsyaBZHQJH6vustCiR1fZQoaAZoCWgPQwgtB3qobYP2v5SGlFKUaBVLMmgWR0CSAGF3IMjNdX2UKGgGaAloD0MIw/UoXI8C87+UhpRSlGgVSzJoFkdAkf+6ASWZ7XV9lChoBmgJaA9DCG3GaYgq/PS/lIaUUpRoFUsyaBZHQJH/NoYekpJ1fZQoaAZoCWgPQwgi41Eq4Qnxv5SGlFKUaBVLMmgWR0CR/r+2mYShdX2UKGgGaAloD0MIWYtPATCeA8CUhpRSlGgVSzJoFkdAkf5Dx5LRKHV9lChoBmgJaA9DCPNUh9wMd/K/lIaUUpRoFUsyaBZHQJH9ywX668R1fZQoaAZoCWgPQwjH155ZEqDmv5SGlFKUaBVLMmgWR0CSA1jNpudgdX2UKGgGaAloD0MITYV4JF4e97+UhpRSlGgVSzJoFkdAkgKxNIsiCHV9lChoBmgJaA9DCBah2Aqa9gXAlIaUUpRoFUsyaBZHQJICLZSNwR51fZQoaAZoCWgPQwi2ErpL4qzlv5SGlFKUaBVLMmgWR0CSAbaLXL/0dX2UKGgGaAloD0MIISI17WIa/b+UhpRSlGgVSzJoFkdAkgE6r/82rHV9lChoBmgJaA9DCAVPIVfqWfm/lIaUUpRoFUsyaBZHQJIAwkRjBmB1fZQoaAZoCWgPQwjqXif1Zen3v5SGlFKUaBVLMmgWR0CSBitZFG5MdX2UKGgGaAloD0MIfQiqRq+G97+UhpRSlGgVSzJoFkdAkgWDjrAxjHV9lChoBmgJaA9DCIZY/RGGge+/lIaUUpRoFUsyaBZHQJIFABkqc3F1fZQoaAZoCWgPQwgBTYQNT+/zv5SGlFKUaBVLMmgWR0CSBIktVaOhdX2UKGgGaAloD0MIhVs+kpJe9L+UhpRSlGgVSzJoFkdAkgQNVea8YnV9lChoBmgJaA9DCMpOP6iL1PG/lIaUUpRoFUsyaBZHQJIDlJg9eQd1fZQoaAZoCWgPQwiDhv4JLlbrv5SGlFKUaBVLMmgWR0CSCQxBE8aGdX2UKGgGaAloD0MIQRAgQ8cO7b+UhpRSlGgVSzJoFkdAkghksJ6Y3XV9lChoBmgJaA9DCJc8npYfGATAlIaUUpRoFUsyaBZHQJIH4S39aU11fZQoaAZoCWgPQwgPuRluwKf1v5SGlFKUaBVLMmgWR0CSB2qvNeMRdX2UKGgGaAloD0MIxvmbUIjA87+UhpRSlGgVSzJoFkdAkgbu67NB4XV9lChoBmgJaA9DCBvZlZaRuve/lIaUUpRoFUsyaBZHQJIGdhd+ocd1fZQoaAZoCWgPQwh7Mv/om/QFwJSGlFKUaBVLMmgWR0CSC+5xBE8adX2UKGgGaAloD0MIUDqRYKqZ67+UhpRSlGgVSzJoFkdAkgtGk8A7xXV9lChoBmgJaA9DCGAgCJChY/q/lIaUUpRoFUsyaBZHQJIKwyhzvJB1fZQoaAZoCWgPQwhOYaWCiur0v5SGlFKUaBVLMmgWR0CSCkxxT850dX2UKGgGaAloD0MIVwdA3NUr+7+UhpRSlGgVSzJoFkdAkgnQemvW6XV9lChoBmgJaA9DCAk02NR5VPC/lIaUUpRoFUsyaBZHQJIJV84Pwux1fZQoaAZoCWgPQwhEqFKzB9rlv5SGlFKUaBVLMmgWR0CSDs8h9srNdX2UKGgGaAloD0MIPBIvT+eK8b+UhpRSlGgVSzJoFkdAkg4nfZVXFXV9lChoBmgJaA9DCAckYd9OouW/lIaUUpRoFUsyaBZHQJINpA/s3Q51fZQoaAZoCWgPQwgdy7vqATP6v5SGlFKUaBVLMmgWR0CSDS0knkT6dX2UKGgGaAloD0MIObNdoQ+W3r+UhpRSlGgVSzJoFkdAkgyxCpm29nV9lChoBmgJaA9DCCbGMv0S8fq/lIaUUpRoFUsyaBZHQJIMOE12q1h1fZQoaAZoCWgPQwhJvDydK0r4v5SGlFKUaBVLMmgWR0CSEbd5IH1OdX2UKGgGaAloD0MIXalnQSgv8b+UhpRSlGgVSzJoFkdAkhEP6CUX53V9lChoBmgJaA9DCN9t3jgpjPa/lIaUUpRoFUsyaBZHQJIQjJQtSQ51fZQoaAZoCWgPQwgrpWd6iZEAwJSGlFKUaBVLMmgWR0CSEBYoy9EkdX2UKGgGaAloD0MIcsPvplu2+7+UhpRSlGgVSzJoFkdAkg+abSZ0CHV9lChoBmgJaA9DCOuLhLacCwTAlIaUUpRoFUsyaBZHQJIPIdXDFZR1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 16667, "n_steps": 5, "gamma": 0.99, "gae_lambda": 1.0, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.29 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.8.10", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
|
replay.mp4
CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward": -
|
|
|
1 |
+
{"mean_reward": -1.1068491909652949, "std_reward": 0.5270952168581304, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-01-20T16:47:10.173839"}
|
vec_normalize.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3056
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06667dc9e6f2fed3e5c3f3e8222d83791416dad962c5d8f0a63271fc63724199
|
3 |
size 3056
|