First Push
Browse files- BigWallJump.onnx +3 -0
- BigWallJump/BigWallJump-18499991.onnx +3 -0
- BigWallJump/BigWallJump-18499991.pt +3 -0
- BigWallJump/BigWallJump-18999986.onnx +3 -0
- BigWallJump/BigWallJump-18999986.pt +3 -0
- BigWallJump/BigWallJump-19499996.onnx +3 -0
- BigWallJump/BigWallJump-19499996.pt +3 -0
- BigWallJump/BigWallJump-19999998.onnx +3 -0
- BigWallJump/BigWallJump-19999998.pt +3 -0
- BigWallJump/BigWallJump-20000020.onnx +3 -0
- BigWallJump/BigWallJump-20000020.pt +3 -0
- BigWallJump/BigWallJump-24803.onnx +3 -0
- BigWallJump/BigWallJump-24803.pt +3 -0
- BigWallJump/BigWallJump-39339.onnx +3 -0
- BigWallJump/BigWallJump-39339.pt +3 -0
- BigWallJump/checkpoint.pt +3 -0
- BigWallJump/events.out.tfevents.1693677309.yaohua-NUC12DCMi7.122030.1 +3 -0
- README.md +35 -0
- SmallWallJump.onnx +3 -0
- SmallWallJump/SmallWallJump-17209.onnx +3 -0
- SmallWallJump/SmallWallJump-17209.pt +3 -0
- SmallWallJump/SmallWallJump-17576.onnx +3 -0
- SmallWallJump/SmallWallJump-17576.pt +3 -0
- SmallWallJump/SmallWallJump-3999997.onnx +3 -0
- SmallWallJump/SmallWallJump-3999997.pt +3 -0
- SmallWallJump/SmallWallJump-4499998.onnx +3 -0
- SmallWallJump/SmallWallJump-4499998.pt +3 -0
- SmallWallJump/SmallWallJump-4999999.onnx +3 -0
- SmallWallJump/SmallWallJump-4999999.pt +3 -0
- SmallWallJump/SmallWallJump-5499990.onnx +3 -0
- SmallWallJump/SmallWallJump-5499990.pt +3 -0
- SmallWallJump/SmallWallJump-5556184.onnx +3 -0
- SmallWallJump/SmallWallJump-5556184.pt +3 -0
- SmallWallJump/checkpoint.pt +3 -0
- SmallWallJump/events.out.tfevents.1693677307.yaohua-NUC12DCMi7.122030.0 +3 -0
- config.json +1 -0
- configuration.yaml +121 -0
- run_logs/timers.json +506 -0
- run_logs/training_status.json +123 -0
BigWallJump.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31a40b36dfed240c7ab2ba57aa6c496078212d7dcce94ff871bd09de7b02b491
|
3 |
+
size 741938
|
BigWallJump/BigWallJump-18499991.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:999e5fdbec013154017a315698a8c432b1d8e9b12e6e9e4b29361bf753558a1f
|
3 |
+
size 741938
|
BigWallJump/BigWallJump-18499991.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3922fcd20fc8804d94d77f6352c4ddc4dbcb0fc789f5938dbbec81c74de0bc78
|
3 |
+
size 4377440
|
BigWallJump/BigWallJump-18999986.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c57fdebb3f3118ed94afa1461f1f6702330c1c05734be772da0500fd167ef49
|
3 |
+
size 741938
|
BigWallJump/BigWallJump-18999986.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:951701de97ef08d512476638c9ac5cd0f94759301c44f213b6ff448da14b99a9
|
3 |
+
size 4377440
|
BigWallJump/BigWallJump-19499996.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1687140d353e5427f859c4c3ea0fc5049a150481aa3e8b94cb2b913753aac535
|
3 |
+
size 741938
|
BigWallJump/BigWallJump-19499996.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14846b956c6c839036ed3d4568c617518c949964f36153d0d5ffacac94170c9c
|
3 |
+
size 4377440
|
BigWallJump/BigWallJump-19999998.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31a40b36dfed240c7ab2ba57aa6c496078212d7dcce94ff871bd09de7b02b491
|
3 |
+
size 741938
|
BigWallJump/BigWallJump-19999998.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb21671ffd052eebd51e6d2a579e828e8ee91f112f611ee1959ce0025ff2ef45
|
3 |
+
size 4377440
|
BigWallJump/BigWallJump-20000020.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31a40b36dfed240c7ab2ba57aa6c496078212d7dcce94ff871bd09de7b02b491
|
3 |
+
size 741938
|
BigWallJump/BigWallJump-20000020.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ef98ec111fc668dd4ca1036a09508467d5753bb08534a75e66e39f6df3d6e48
|
3 |
+
size 4377440
|
BigWallJump/BigWallJump-24803.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5caedf81c91eaf3eba503198dcb9ae508346f755c1cedc5ab2a07e6e9ef39e05
|
3 |
+
size 741938
|
BigWallJump/BigWallJump-24803.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:261abf29a5acff0fab040c4afdc854d8e67e2eb54c2a5d799162a4a8ff185bf3
|
3 |
+
size 4377191
|
BigWallJump/BigWallJump-39339.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb1ff0bb2c4488324597f0f507eedf260718b1272e2be32f2945e4c6719882fa
|
3 |
+
size 741938
|
BigWallJump/BigWallJump-39339.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b32f22287fb2ca5023f14fb2060df26ececf1662fbe0aa018539dfcf4010b038
|
3 |
+
size 4377191
|
BigWallJump/checkpoint.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59bd8db2cb7912688d88c27763ae8493f368dea3484b53d00bd3b668f8c4a546
|
3 |
+
size 4376610
|
BigWallJump/events.out.tfevents.1693677309.yaohua-NUC12DCMi7.122030.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:972e7d53472beccca4f37a3e1186611f248ac066b63b4ab150bf859a24da88c5
|
3 |
+
size 10113085
|
README.md
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: ml-agents
|
3 |
+
tags:
|
4 |
+
- BigWallJump
|
5 |
+
- deep-reinforcement-learning
|
6 |
+
- reinforcement-learning
|
7 |
+
- ML-Agents-BigWallJump
|
8 |
+
---
|
9 |
+
|
10 |
+
# **ppo** Agent playing **BigWallJump**
|
11 |
+
This is a trained model of a **ppo** agent playing **BigWallJump**
|
12 |
+
using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
|
13 |
+
|
14 |
+
## Usage (with ML-Agents)
|
15 |
+
The Documentation: https://unity-technologies.github.io/ml-agents/ML-Agents-Toolkit-Documentation/
|
16 |
+
|
17 |
+
We wrote complete tutorials to help you learn how to train your first agent using ML-Agents and publish it to the Hub:
|
18 |
+
- A *short tutorial* where you teach Huggy the Dog 🐶 to fetch the stick and then play with him directly in your
|
19 |
+
browser: https://huggingface.co/learn/deep-rl-course/unitbonus1/introduction
|
20 |
+
- A *longer tutorial* to understand how ML-Agents works:
|
21 |
+
https://huggingface.co/learn/deep-rl-course/unit5/introduction
|
22 |
+
|
23 |
+
### Resume the training
|
24 |
+
```bash
|
25 |
+
mlagents-learn <your_configuration_file_path.yaml> --run-id=<run_id> --resume
|
26 |
+
```
|
27 |
+
|
28 |
+
### Watch your Agent play
|
29 |
+
You can watch your agent **playing directly in your browser**:
|
30 |
+
|
31 |
+
1. If the environment is part of ML-Agents official environments, go to https://huggingface.co/unity
|
32 |
+
2. Find your model_id: yaohuacn/walljump_test_02
|
33 |
+
3. Select your *.nn / *.onnx file
|
34 |
+
4. Click on Watch the agent play 👀
|
35 |
+
|
SmallWallJump.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ac7e842133d1d95145f1aa3c6fbf2dac4b0def184bbce5f8500359172957348
|
3 |
+
size 741938
|
SmallWallJump/SmallWallJump-17209.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6aa8c6291f8bab28dfb8ba5017e1aca82fa9eadd1624450507033be7da8cdc8
|
3 |
+
size 741938
|
SmallWallJump/SmallWallJump-17209.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:761179a5902d65978d60a01ca0d5f06a73365e52ecdb7640c4e3b767bceacad4
|
3 |
+
size 4377357
|
SmallWallJump/SmallWallJump-17576.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9941ae401d7528ee4bb588d0b1e2d90a1dc3ee3f4296e85d32d7199c2d720869
|
3 |
+
size 741938
|
SmallWallJump/SmallWallJump-17576.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f7676a4850568be437295d22e1a2499469d3c2bd7af14e4775fda8bebd5ce67
|
3 |
+
size 4377357
|
SmallWallJump/SmallWallJump-3999997.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0801d7a093fff5c5d3cc78ac62d60f323481ebffb98fd5dd9f2ce3ac7cf1cf90
|
3 |
+
size 741938
|
SmallWallJump/SmallWallJump-3999997.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79967437cfd06f9d9506705d97abfbfe8029c8f3af916679585199631e801a50
|
3 |
+
size 4377523
|
SmallWallJump/SmallWallJump-4499998.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b6de973302486bf8b70b24e909b5829f4011407dcef0387fc977dd2a5293a2e
|
3 |
+
size 741938
|
SmallWallJump/SmallWallJump-4499998.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77464c6bd8300540cf6bbf16bf5f470f9ab5d697a329cc4db72c05077259d53a
|
3 |
+
size 4377523
|
SmallWallJump/SmallWallJump-4999999.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ac7e842133d1d95145f1aa3c6fbf2dac4b0def184bbce5f8500359172957348
|
3 |
+
size 741938
|
SmallWallJump/SmallWallJump-4999999.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f16cc083805d04832936686e4b79083012c3583a258c20dee49a7c12120c716
|
3 |
+
size 4377523
|
SmallWallJump/SmallWallJump-5499990.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ac7e842133d1d95145f1aa3c6fbf2dac4b0def184bbce5f8500359172957348
|
3 |
+
size 741938
|
SmallWallJump/SmallWallJump-5499990.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e437711650f830f9c24003f722b8ad9f1643dc096c088122f15322a710fd9ca2
|
3 |
+
size 4377523
|
SmallWallJump/SmallWallJump-5556184.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ac7e842133d1d95145f1aa3c6fbf2dac4b0def184bbce5f8500359172957348
|
3 |
+
size 741938
|
SmallWallJump/SmallWallJump-5556184.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fda7b8d42a477a77ecb057336760664778e12f7357825161c16ea1a7dd4902c1
|
3 |
+
size 4377523
|
SmallWallJump/checkpoint.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c37f3d482e0dff43cbdc55882a90ed1930e1e04f39114bcef9e07593df3f22f7
|
3 |
+
size 4376610
|
SmallWallJump/events.out.tfevents.1693677307.yaohua-NUC12DCMi7.122030.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:793b770078255796f7c47dbafa509a785c2a91d606a17aebc63a9698f5e42d87
|
3 |
+
size 2786054
|
config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"default_settings": null, "behaviors": {"BigWallJump": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 1024, "buffer_size": 4096, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 20000000, "time_horizon": 128, "summary_freq": 20000, "threaded": false, "self_play": null, "behavioral_cloning": null}, "SmallWallJump": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 1024, "buffer_size": 4096, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 5000000, "time_horizon": 128, "summary_freq": 20000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, 
"env_settings": {"env_path": null, "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "walljump_test_02", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
|
configuration.yaml
ADDED
@@ -0,0 +1,121 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
default_settings: null
|
2 |
+
behaviors:
|
3 |
+
BigWallJump:
|
4 |
+
trainer_type: ppo
|
5 |
+
hyperparameters:
|
6 |
+
batch_size: 1024
|
7 |
+
buffer_size: 4096
|
8 |
+
learning_rate: 0.0003
|
9 |
+
beta: 0.005
|
10 |
+
epsilon: 0.2
|
11 |
+
lambd: 0.95
|
12 |
+
num_epoch: 3
|
13 |
+
shared_critic: false
|
14 |
+
learning_rate_schedule: linear
|
15 |
+
beta_schedule: linear
|
16 |
+
epsilon_schedule: linear
|
17 |
+
checkpoint_interval: 500000
|
18 |
+
network_settings:
|
19 |
+
normalize: false
|
20 |
+
hidden_units: 256
|
21 |
+
num_layers: 2
|
22 |
+
vis_encode_type: simple
|
23 |
+
memory: null
|
24 |
+
goal_conditioning_type: hyper
|
25 |
+
deterministic: false
|
26 |
+
reward_signals:
|
27 |
+
extrinsic:
|
28 |
+
gamma: 0.99
|
29 |
+
strength: 1.0
|
30 |
+
network_settings:
|
31 |
+
normalize: false
|
32 |
+
hidden_units: 128
|
33 |
+
num_layers: 2
|
34 |
+
vis_encode_type: simple
|
35 |
+
memory: null
|
36 |
+
goal_conditioning_type: hyper
|
37 |
+
deterministic: false
|
38 |
+
init_path: null
|
39 |
+
keep_checkpoints: 5
|
40 |
+
even_checkpoints: false
|
41 |
+
max_steps: 20000000
|
42 |
+
time_horizon: 128
|
43 |
+
summary_freq: 20000
|
44 |
+
threaded: false
|
45 |
+
self_play: null
|
46 |
+
behavioral_cloning: null
|
47 |
+
SmallWallJump:
|
48 |
+
trainer_type: ppo
|
49 |
+
hyperparameters:
|
50 |
+
batch_size: 1024
|
51 |
+
buffer_size: 4096
|
52 |
+
learning_rate: 0.0003
|
53 |
+
beta: 0.005
|
54 |
+
epsilon: 0.2
|
55 |
+
lambd: 0.95
|
56 |
+
num_epoch: 3
|
57 |
+
shared_critic: false
|
58 |
+
learning_rate_schedule: linear
|
59 |
+
beta_schedule: linear
|
60 |
+
epsilon_schedule: linear
|
61 |
+
checkpoint_interval: 500000
|
62 |
+
network_settings:
|
63 |
+
normalize: false
|
64 |
+
hidden_units: 256
|
65 |
+
num_layers: 2
|
66 |
+
vis_encode_type: simple
|
67 |
+
memory: null
|
68 |
+
goal_conditioning_type: hyper
|
69 |
+
deterministic: false
|
70 |
+
reward_signals:
|
71 |
+
extrinsic:
|
72 |
+
gamma: 0.99
|
73 |
+
strength: 1.0
|
74 |
+
network_settings:
|
75 |
+
normalize: false
|
76 |
+
hidden_units: 128
|
77 |
+
num_layers: 2
|
78 |
+
vis_encode_type: simple
|
79 |
+
memory: null
|
80 |
+
goal_conditioning_type: hyper
|
81 |
+
deterministic: false
|
82 |
+
init_path: null
|
83 |
+
keep_checkpoints: 5
|
84 |
+
even_checkpoints: false
|
85 |
+
max_steps: 5000000
|
86 |
+
time_horizon: 128
|
87 |
+
summary_freq: 20000
|
88 |
+
threaded: false
|
89 |
+
self_play: null
|
90 |
+
behavioral_cloning: null
|
91 |
+
env_settings:
|
92 |
+
env_path: null
|
93 |
+
env_args: null
|
94 |
+
base_port: 5005
|
95 |
+
num_envs: 1
|
96 |
+
num_areas: 1
|
97 |
+
seed: -1
|
98 |
+
max_lifetime_restarts: 10
|
99 |
+
restarts_rate_limit_n: 1
|
100 |
+
restarts_rate_limit_period_s: 60
|
101 |
+
engine_settings:
|
102 |
+
width: 84
|
103 |
+
height: 84
|
104 |
+
quality_level: 5
|
105 |
+
time_scale: 20
|
106 |
+
target_frame_rate: -1
|
107 |
+
capture_frame_rate: 60
|
108 |
+
no_graphics: false
|
109 |
+
environment_parameters: null
|
110 |
+
checkpoint_settings:
|
111 |
+
run_id: walljump_test_02
|
112 |
+
initialize_from: null
|
113 |
+
load_model: false
|
114 |
+
resume: false
|
115 |
+
force: true
|
116 |
+
train_model: false
|
117 |
+
inference: false
|
118 |
+
results_dir: results
|
119 |
+
torch_settings:
|
120 |
+
device: null
|
121 |
+
debug: false
|
run_logs/timers.json
ADDED
@@ -0,0 +1,506 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "root",
|
3 |
+
"gauges": {
|
4 |
+
"BigWallJump.Policy.Entropy.mean": {
|
5 |
+
"value": 0.9725682139396667,
|
6 |
+
"min": 0.9625186920166016,
|
7 |
+
"max": 3.9519944190979004,
|
8 |
+
"count": 1000
|
9 |
+
},
|
10 |
+
"BigWallJump.Policy.Entropy.sum": {
|
11 |
+
"value": 19416.3515625,
|
12 |
+
"min": 19233.048828125,
|
13 |
+
"max": 82067.1171875,
|
14 |
+
"count": 1000
|
15 |
+
},
|
16 |
+
"BigWallJump.Environment.EpisodeLength.mean": {
|
17 |
+
"value": 24.652564102564103,
|
18 |
+
"min": 24.180100755667507,
|
19 |
+
"max": 360.2857142857143,
|
20 |
+
"count": 1000
|
21 |
+
},
|
22 |
+
"BigWallJump.Environment.EpisodeLength.sum": {
|
23 |
+
"value": 19229.0,
|
24 |
+
"min": 17869.0,
|
25 |
+
"max": 22004.0,
|
26 |
+
"count": 1000
|
27 |
+
},
|
28 |
+
"BigWallJump.Step.mean": {
|
29 |
+
"value": 19999998.0,
|
30 |
+
"min": 19986.0,
|
31 |
+
"max": 19999998.0,
|
32 |
+
"count": 1000
|
33 |
+
},
|
34 |
+
"BigWallJump.Step.sum": {
|
35 |
+
"value": 19999998.0,
|
36 |
+
"min": 19986.0,
|
37 |
+
"max": 19999998.0,
|
38 |
+
"count": 1000
|
39 |
+
},
|
40 |
+
"BigWallJump.Policy.ExtrinsicValueEstimate.mean": {
|
41 |
+
"value": 0.8230504989624023,
|
42 |
+
"min": -0.5544101595878601,
|
43 |
+
"max": 0.8362411856651306,
|
44 |
+
"count": 1000
|
45 |
+
},
|
46 |
+
"BigWallJump.Policy.ExtrinsicValueEstimate.sum": {
|
47 |
+
"value": 641.9793701171875,
|
48 |
+
"min": -146.78138732910156,
|
49 |
+
"max": 659.5391235351562,
|
50 |
+
"count": 1000
|
51 |
+
},
|
52 |
+
"BigWallJump.Environment.CumulativeReward.mean": {
|
53 |
+
"value": 0.8793814066128853,
|
54 |
+
"min": -1.2468177382446204,
|
55 |
+
"max": 0.9177374817593565,
|
56 |
+
"count": 1000
|
57 |
+
},
|
58 |
+
"BigWallJump.Environment.CumulativeReward.sum": {
|
59 |
+
"value": 685.9174971580505,
|
60 |
+
"min": -337.0195025871508,
|
61 |
+
"max": 719.9999975562096,
|
62 |
+
"count": 1000
|
63 |
+
},
|
64 |
+
"BigWallJump.Policy.ExtrinsicReward.mean": {
|
65 |
+
"value": 0.8793814066128853,
|
66 |
+
"min": -1.2468177382446204,
|
67 |
+
"max": 0.9177374817593565,
|
68 |
+
"count": 1000
|
69 |
+
},
|
70 |
+
"BigWallJump.Policy.ExtrinsicReward.sum": {
|
71 |
+
"value": 685.9174971580505,
|
72 |
+
"min": -337.0195025871508,
|
73 |
+
"max": 719.9999975562096,
|
74 |
+
"count": 1000
|
75 |
+
},
|
76 |
+
"BigWallJump.Losses.PolicyLoss.mean": {
|
77 |
+
"value": 0.017277905321680005,
|
78 |
+
"min": 0.013837956769081453,
|
79 |
+
"max": 0.03131256672592523,
|
80 |
+
"count": 1000
|
81 |
+
},
|
82 |
+
"BigWallJump.Losses.PolicyLoss.sum": {
|
83 |
+
"value": 0.08638952660840003,
|
84 |
+
"min": 0.06026011286303401,
|
85 |
+
"max": 0.15406981386089075,
|
86 |
+
"count": 1000
|
87 |
+
},
|
88 |
+
"BigWallJump.Losses.ValueLoss.mean": {
|
89 |
+
"value": 0.02471310798233996,
|
90 |
+
"min": 0.002555308794399025,
|
91 |
+
"max": 0.08699909243732691,
|
92 |
+
"count": 1000
|
93 |
+
},
|
94 |
+
"BigWallJump.Losses.ValueLoss.sum": {
|
95 |
+
"value": 0.1235655399116998,
|
96 |
+
"min": 0.0102212351775961,
|
97 |
+
"max": 0.43499546218663454,
|
98 |
+
"count": 1000
|
99 |
+
},
|
100 |
+
"BigWallJump.Policy.LearningRate.mean": {
|
101 |
+
"value": 1.7335894224700115e-07,
|
102 |
+
"min": 1.7335894224700115e-07,
|
103 |
+
"max": 0.0002998448963017012,
|
104 |
+
"count": 1000
|
105 |
+
},
|
106 |
+
"BigWallJump.Policy.LearningRate.sum": {
|
107 |
+
"value": 8.667947112350057e-07,
|
108 |
+
"min": 8.667947112350057e-07,
|
109 |
+
"max": 0.001497824085725305,
|
110 |
+
"count": 1000
|
111 |
+
},
|
112 |
+
"BigWallJump.Policy.Epsilon.mean": {
|
113 |
+
"value": 0.100057753,
|
114 |
+
"min": 0.100057753,
|
115 |
+
"max": 0.19994829875000003,
|
116 |
+
"count": 1000
|
117 |
+
},
|
118 |
+
"BigWallJump.Policy.Epsilon.sum": {
|
119 |
+
"value": 0.500288765,
|
120 |
+
"min": 0.400600675,
|
121 |
+
"max": 0.999274695,
|
122 |
+
"count": 1000
|
123 |
+
},
|
124 |
+
"BigWallJump.Policy.Beta.mean": {
|
125 |
+
"value": 1.2881874700000022e-05,
|
126 |
+
"min": 1.2881874700000022e-05,
|
127 |
+
"max": 0.004997420107625,
|
128 |
+
"count": 1000
|
129 |
+
},
|
130 |
+
"BigWallJump.Policy.Beta.sum": {
|
131 |
+
"value": 6.44093735000001e-05,
|
132 |
+
"min": 6.44093735000001e-05,
|
133 |
+
"max": 0.024963807280500003,
|
134 |
+
"count": 1000
|
135 |
+
},
|
136 |
+
"BigWallJump.IsTraining.mean": {
|
137 |
+
"value": 1.0,
|
138 |
+
"min": 1.0,
|
139 |
+
"max": 1.0,
|
140 |
+
"count": 1000
|
141 |
+
},
|
142 |
+
"BigWallJump.IsTraining.sum": {
|
143 |
+
"value": 1.0,
|
144 |
+
"min": 1.0,
|
145 |
+
"max": 1.0,
|
146 |
+
"count": 1000
|
147 |
+
},
|
148 |
+
"SmallWallJump.Policy.Entropy.mean": {
|
149 |
+
"value": 1.1432201862335205,
|
150 |
+
"min": 1.127864122390747,
|
151 |
+
"max": 3.9578561782836914,
|
152 |
+
"count": 277
|
153 |
+
},
|
154 |
+
"SmallWallJump.Policy.Entropy.sum": {
|
155 |
+
"value": 22802.669921875,
|
156 |
+
"min": 22546.00390625,
|
157 |
+
"max": 80419.6796875,
|
158 |
+
"count": 277
|
159 |
+
},
|
160 |
+
"SmallWallJump.Environment.EpisodeLength.mean": {
|
161 |
+
"value": 14.281130634071811,
|
162 |
+
"min": 13.952914798206278,
|
163 |
+
"max": 78.04247104247104,
|
164 |
+
"count": 277
|
165 |
+
},
|
166 |
+
"SmallWallJump.Environment.EpisodeLength.sum": {
|
167 |
+
"value": 18694.0,
|
168 |
+
"min": 18662.0,
|
169 |
+
"max": 20213.0,
|
170 |
+
"count": 277
|
171 |
+
},
|
172 |
+
"SmallWallJump.Step.mean": {
|
173 |
+
"value": 5539990.0,
|
174 |
+
"min": 19906.0,
|
175 |
+
"max": 5539990.0,
|
176 |
+
"count": 277
|
177 |
+
},
|
178 |
+
"SmallWallJump.Step.sum": {
|
179 |
+
"value": 5539990.0,
|
180 |
+
"min": 19906.0,
|
181 |
+
"max": 5539990.0,
|
182 |
+
"count": 277
|
183 |
+
},
|
184 |
+
"SmallWallJump.Policy.ExtrinsicValueEstimate.mean": {
|
185 |
+
"value": 0.9011476635932922,
|
186 |
+
"min": -0.4881293773651123,
|
187 |
+
"max": 0.9083206057548523,
|
188 |
+
"count": 277
|
189 |
+
},
|
190 |
+
"SmallWallJump.Policy.ExtrinsicValueEstimate.sum": {
|
191 |
+
"value": 1179.602294921875,
|
192 |
+
"min": -156.6895294189453,
|
193 |
+
"max": 1206.5859375,
|
194 |
+
"count": 277
|
195 |
+
},
|
196 |
+
"SmallWallJump.Environment.CumulativeReward.mean": {
|
197 |
+
"value": 0.9520741039965334,
|
198 |
+
"min": -1.0653809613504563,
|
199 |
+
"max": 0.9619308807722704,
|
200 |
+
"count": 277
|
201 |
+
},
|
202 |
+
"SmallWallJump.Environment.CumulativeReward.sum": {
|
203 |
+
"value": 1246.265002131462,
|
204 |
+
"min": -357.96800301375333,
|
205 |
+
"max": 1280.3300023078918,
|
206 |
+
"count": 277
|
207 |
+
},
|
208 |
+
"SmallWallJump.Policy.ExtrinsicReward.mean": {
|
209 |
+
"value": 0.9520741039965334,
|
210 |
+
"min": -1.0653809613504563,
|
211 |
+
"max": 0.9619308807722704,
|
212 |
+
"count": 277
|
213 |
+
},
|
214 |
+
"SmallWallJump.Policy.ExtrinsicReward.sum": {
|
215 |
+
"value": 1246.265002131462,
|
216 |
+
"min": -357.96800301375333,
|
217 |
+
"max": 1280.3300023078918,
|
218 |
+
"count": 277
|
219 |
+
},
|
220 |
+
"SmallWallJump.Losses.PolicyLoss.mean": {
|
221 |
+
"value": 0.020284520431111255,
|
222 |
+
"min": 0.014728642107608417,
|
223 |
+
"max": 0.027711384867628412,
|
224 |
+
"count": 250
|
225 |
+
},
|
226 |
+
"SmallWallJump.Losses.PolicyLoss.sum": {
|
227 |
+
"value": 0.10142260215555628,
|
228 |
+
"min": 0.06312889838591218,
|
229 |
+
"max": 0.13855692433814207,
|
230 |
+
"count": 250
|
231 |
+
},
|
232 |
+
"SmallWallJump.Losses.ValueLoss.mean": {
|
233 |
+
"value": 0.014050534221072062,
|
234 |
+
"min": 0.004349971085321158,
|
235 |
+
"max": 0.12879822564621765,
|
236 |
+
"count": 250
|
237 |
+
},
|
238 |
+
"SmallWallJump.Losses.ValueLoss.sum": {
|
239 |
+
"value": 0.0702526711053603,
|
240 |
+
"min": 0.0178363644372439,
|
241 |
+
"max": 0.6439911282310883,
|
242 |
+
"count": 250
|
243 |
+
},
|
244 |
+
"SmallWallJump.Policy.LearningRate.mean": {
|
245 |
+
"value": 5.532878156039934e-07,
|
246 |
+
"min": 5.532878156039934e-07,
|
247 |
+
"max": 0.00029937621020793,
|
248 |
+
"count": 250
|
249 |
+
},
|
250 |
+
"SmallWallJump.Policy.LearningRate.sum": {
|
251 |
+
"value": 2.7664390780199667e-06,
|
252 |
+
"min": 2.7664390780199667e-06,
|
253 |
+
"max": 0.00149128866290378,
|
254 |
+
"count": 250
|
255 |
+
},
|
256 |
+
"SmallWallJump.Policy.Epsilon.mean": {
|
257 |
+
"value": 0.100184396,
|
258 |
+
"min": 0.100184396,
|
259 |
+
"max": 0.19979207000000002,
|
260 |
+
"count": 250
|
261 |
+
},
|
262 |
+
"SmallWallJump.Policy.Epsilon.sum": {
|
263 |
+
"value": 0.50092198,
|
264 |
+
"min": 0.40878648000000006,
|
265 |
+
"max": 0.9970962200000001,
|
266 |
+
"count": 250
|
267 |
+
},
|
268 |
+
"SmallWallJump.Policy.Beta.mean": {
|
269 |
+
"value": 1.9201360399999894e-05,
|
270 |
+
"min": 1.9201360399999894e-05,
|
271 |
+
"max": 0.004989624293,
|
272 |
+
"count": 250
|
273 |
+
},
|
274 |
+
"SmallWallJump.Policy.Beta.sum": {
|
275 |
+
"value": 9.600680199999947e-05,
|
276 |
+
"min": 9.600680199999947e-05,
|
277 |
+
"max": 0.024855101378000004,
|
278 |
+
"count": 250
|
279 |
+
},
|
280 |
+
"SmallWallJump.IsTraining.mean": {
|
281 |
+
"value": 0.0,
|
282 |
+
"min": 0.0,
|
283 |
+
"max": 1.0,
|
284 |
+
"count": 277
|
285 |
+
},
|
286 |
+
"SmallWallJump.IsTraining.sum": {
|
287 |
+
"value": 0.0,
|
288 |
+
"min": 0.0,
|
289 |
+
"max": 1.0,
|
290 |
+
"count": 277
|
291 |
+
}
|
292 |
+
},
|
293 |
+
"metadata": {
|
294 |
+
"timer_format_version": "0.1.0",
|
295 |
+
"start_time_seconds": "1693677305",
|
296 |
+
"python_version": "3.10.10 (main, Mar 21 2023, 18:45:11) [GCC 11.2.0]",
|
297 |
+
"command_line_arguments": "/home/yaohua/miniconda3/envs/drl2/bin/mlagents-learn config/ppo/WallJump.yaml --run-id=walljump_test_02 --force",
|
298 |
+
"mlagents_version": "0.31.0.dev0",
|
299 |
+
"mlagents_envs_version": "0.31.0.dev0",
|
300 |
+
"communication_protocol_version": "1.5.0",
|
301 |
+
"pytorch_version": "2.1.0.dev20230902+cu121",
|
302 |
+
"numpy_version": "1.21.2",
|
303 |
+
"end_time_seconds": "1693694847"
|
304 |
+
},
|
305 |
+
"total": 17542.104710366002,
|
306 |
+
"count": 1,
|
307 |
+
"self": 0.0042794360051630065,
|
308 |
+
"children": {
|
309 |
+
"run_training.setup": {
|
310 |
+
"total": 0.2931904069992015,
|
311 |
+
"count": 1,
|
312 |
+
"self": 0.2931904069992015
|
313 |
+
},
|
314 |
+
"TrainerController.start_learning": {
|
315 |
+
"total": 17541.807240522998,
|
316 |
+
"count": 1,
|
317 |
+
"self": 23.918419953661214,
|
318 |
+
"children": {
|
319 |
+
"TrainerController._reset_env": {
|
320 |
+
"total": 4.204136708998703,
|
321 |
+
"count": 1,
|
322 |
+
"self": 4.204136708998703
|
323 |
+
},
|
324 |
+
"TrainerController.advance": {
|
325 |
+
"total": 17513.588606540332,
|
326 |
+
"count": 1649473,
|
327 |
+
"self": 25.197562763569294,
|
328 |
+
"children": {
|
329 |
+
"env_step": {
|
330 |
+
"total": 12823.833156169661,
|
331 |
+
"count": 1649473,
|
332 |
+
"self": 9685.534935636744,
|
333 |
+
"children": {
|
334 |
+
"SubprocessEnvManager._take_step": {
|
335 |
+
"total": 3124.260964101806,
|
336 |
+
"count": 1649473,
|
337 |
+
"self": 82.05208733542531,
|
338 |
+
"children": {
|
339 |
+
"TorchPolicy.evaluate": {
|
340 |
+
"total": 3042.208876766381,
|
341 |
+
"count": 2084685,
|
342 |
+
"self": 3042.208876766381
|
343 |
+
}
|
344 |
+
}
|
345 |
+
},
|
346 |
+
"workers": {
|
347 |
+
"total": 14.037256431111018,
|
348 |
+
"count": 1649473,
|
349 |
+
"self": 0.0,
|
350 |
+
"children": {
|
351 |
+
"worker_root": {
|
352 |
+
"total": 17510.696612694024,
|
353 |
+
"count": 1649473,
|
354 |
+
"is_parallel": true,
|
355 |
+
"self": 9345.517714997717,
|
356 |
+
"children": {
|
357 |
+
"run_training.setup": {
|
358 |
+
"total": 0.0,
|
359 |
+
"count": 0,
|
360 |
+
"is_parallel": true,
|
361 |
+
"self": 0.0,
|
362 |
+
"children": {
|
363 |
+
"steps_from_proto": {
|
364 |
+
"total": 0.0019906219968106598,
|
365 |
+
"count": 2,
|
366 |
+
"is_parallel": true,
|
367 |
+
"self": 0.00035755999124376103,
|
368 |
+
"children": {
|
369 |
+
"_process_rank_one_or_two_observation": {
|
370 |
+
"total": 0.0016330620055668987,
|
371 |
+
"count": 12,
|
372 |
+
"is_parallel": true,
|
373 |
+
"self": 0.0016330620055668987
|
374 |
+
}
|
375 |
+
}
|
376 |
+
},
|
377 |
+
"UnityEnvironment.step": {
|
378 |
+
"total": 0.015547777999017853,
|
379 |
+
"count": 1,
|
380 |
+
"is_parallel": true,
|
381 |
+
"self": 0.00021877400286030024,
|
382 |
+
"children": {
|
383 |
+
"UnityEnvironment._generate_step_input": {
|
384 |
+
"total": 0.00022080600319895893,
|
385 |
+
"count": 1,
|
386 |
+
"is_parallel": true,
|
387 |
+
"self": 0.00022080600319895893
|
388 |
+
},
|
389 |
+
"communicator.exchange": {
|
390 |
+
"total": 0.014489156994386576,
|
391 |
+
"count": 1,
|
392 |
+
"is_parallel": true,
|
393 |
+
"self": 0.014489156994386576
|
394 |
+
},
|
395 |
+
"steps_from_proto": {
|
396 |
+
"total": 0.000619040998572018,
|
397 |
+
"count": 2,
|
398 |
+
"is_parallel": true,
|
399 |
+
"self": 0.00011063999409088865,
|
400 |
+
"children": {
|
401 |
+
"_process_rank_one_or_two_observation": {
|
402 |
+
"total": 0.0005084010044811293,
|
403 |
+
"count": 12,
|
404 |
+
"is_parallel": true,
|
405 |
+
"self": 0.0005084010044811293
|
406 |
+
}
|
407 |
+
}
|
408 |
+
}
|
409 |
+
}
|
410 |
+
}
|
411 |
+
}
|
412 |
+
},
|
413 |
+
"UnityEnvironment.step": {
|
414 |
+
"total": 8165.178897696307,
|
415 |
+
"count": 1649472,
|
416 |
+
"is_parallel": true,
|
417 |
+
"self": 376.3883987422014,
|
418 |
+
"children": {
|
419 |
+
"UnityEnvironment._generate_step_input": {
|
420 |
+
"total": 164.2484304461541,
|
421 |
+
"count": 1649472,
|
422 |
+
"is_parallel": true,
|
423 |
+
"self": 164.2484304461541
|
424 |
+
},
|
425 |
+
"communicator.exchange": {
|
426 |
+
"total": 6517.66026597649,
|
427 |
+
"count": 1649472,
|
428 |
+
"is_parallel": true,
|
429 |
+
"self": 6517.66026597649
|
430 |
+
},
|
431 |
+
"steps_from_proto": {
|
432 |
+
"total": 1106.8818025314613,
|
433 |
+
"count": 3298944,
|
434 |
+
"is_parallel": true,
|
435 |
+
"self": 223.7129027638657,
|
436 |
+
"children": {
|
437 |
+
"_process_rank_one_or_two_observation": {
|
438 |
+
"total": 883.1688997675956,
|
439 |
+
"count": 19793664,
|
440 |
+
"is_parallel": true,
|
441 |
+
"self": 883.1688997675956
|
442 |
+
}
|
443 |
+
}
|
444 |
+
}
|
445 |
+
}
|
446 |
+
}
|
447 |
+
}
|
448 |
+
}
|
449 |
+
}
|
450 |
+
}
|
451 |
+
}
|
452 |
+
},
|
453 |
+
"trainer_advance": {
|
454 |
+
"total": 4664.557887607101,
|
455 |
+
"count": 3298946,
|
456 |
+
"self": 64.85026829431445,
|
457 |
+
"children": {
|
458 |
+
"process_trajectory": {
|
459 |
+
"total": 1843.857758643273,
|
460 |
+
"count": 3298946,
|
461 |
+
"self": 1841.3516648222503,
|
462 |
+
"children": {
|
463 |
+
"RLTrainer._checkpoint": {
|
464 |
+
"total": 2.5060938210226595,
|
465 |
+
"count": 51,
|
466 |
+
"self": 2.5060938210226595
|
467 |
+
}
|
468 |
+
}
|
469 |
+
},
|
470 |
+
"_update_policy": {
|
471 |
+
"total": 2755.849860669514,
|
472 |
+
"count": 6056,
|
473 |
+
"self": 2171.7557627543065,
|
474 |
+
"children": {
|
475 |
+
"TorchPPOOptimizer.update": {
|
476 |
+
"total": 584.0940979152074,
|
477 |
+
"count": 72672,
|
478 |
+
"self": 584.0940979152074
|
479 |
+
}
|
480 |
+
}
|
481 |
+
}
|
482 |
+
}
|
483 |
+
}
|
484 |
+
}
|
485 |
+
},
|
486 |
+
"trainer_threads": {
|
487 |
+
"total": 5.440015229396522e-07,
|
488 |
+
"count": 1,
|
489 |
+
"self": 5.440015229396522e-07
|
490 |
+
},
|
491 |
+
"TrainerController._save_models": {
|
492 |
+
"total": 0.09607677600433817,
|
493 |
+
"count": 1,
|
494 |
+
"self": 0.0014533749999827705,
|
495 |
+
"children": {
|
496 |
+
"RLTrainer._checkpoint": {
|
497 |
+
"total": 0.0946234010043554,
|
498 |
+
"count": 2,
|
499 |
+
"self": 0.0946234010043554
|
500 |
+
}
|
501 |
+
}
|
502 |
+
}
|
503 |
+
}
|
504 |
+
}
|
505 |
+
}
|
506 |
+
}
|
run_logs/training_status.json
ADDED
@@ -0,0 +1,123 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"BigWallJump": {
|
3 |
+
"checkpoints": [
|
4 |
+
{
|
5 |
+
"steps": 18499991,
|
6 |
+
"file_path": "results/walljump_test_02/BigWallJump/BigWallJump-18499991.onnx",
|
7 |
+
"reward": 0.9090624977099268,
|
8 |
+
"creation_time": 1693693410.7455392,
|
9 |
+
"auxillary_file_paths": [
|
10 |
+
"results/walljump_test_02/BigWallJump/BigWallJump-18499991.pt"
|
11 |
+
]
|
12 |
+
},
|
13 |
+
{
|
14 |
+
"steps": 18999986,
|
15 |
+
"file_path": "results/walljump_test_02/BigWallJump/BigWallJump-18999986.onnx",
|
16 |
+
"reward": 0.8938157878423992,
|
17 |
+
"creation_time": 1693693892.4702873,
|
18 |
+
"auxillary_file_paths": [
|
19 |
+
"results/walljump_test_02/BigWallJump/BigWallJump-18999986.pt"
|
20 |
+
]
|
21 |
+
},
|
22 |
+
{
|
23 |
+
"steps": 19499996,
|
24 |
+
"file_path": "results/walljump_test_02/BigWallJump/BigWallJump-19499996.onnx",
|
25 |
+
"reward": 0.8163281232118607,
|
26 |
+
"creation_time": 1693694371.794366,
|
27 |
+
"auxillary_file_paths": [
|
28 |
+
"results/walljump_test_02/BigWallJump/BigWallJump-19499996.pt"
|
29 |
+
]
|
30 |
+
},
|
31 |
+
{
|
32 |
+
"steps": 19999998,
|
33 |
+
"file_path": "results/walljump_test_02/BigWallJump/BigWallJump-19999998.onnx",
|
34 |
+
"reward": 0.861711534170004,
|
35 |
+
"creation_time": 1693694847.2846408,
|
36 |
+
"auxillary_file_paths": [
|
37 |
+
"results/walljump_test_02/BigWallJump/BigWallJump-19999998.pt"
|
38 |
+
]
|
39 |
+
},
|
40 |
+
{
|
41 |
+
"steps": 20000020,
|
42 |
+
"file_path": "results/walljump_test_02/BigWallJump/BigWallJump-20000020.onnx",
|
43 |
+
"reward": 0.8623664078821662,
|
44 |
+
"creation_time": 1693694847.3825753,
|
45 |
+
"auxillary_file_paths": [
|
46 |
+
"results/walljump_test_02/BigWallJump/BigWallJump-20000020.pt"
|
47 |
+
]
|
48 |
+
}
|
49 |
+
],
|
50 |
+
"final_checkpoint": {
|
51 |
+
"steps": 20000020,
|
52 |
+
"file_path": "results/walljump_test_02/BigWallJump.onnx",
|
53 |
+
"reward": 0.8623664078821662,
|
54 |
+
"creation_time": 1693694847.3825753,
|
55 |
+
"auxillary_file_paths": [
|
56 |
+
"results/walljump_test_02/BigWallJump/BigWallJump-20000020.pt"
|
57 |
+
]
|
58 |
+
}
|
59 |
+
},
|
60 |
+
"SmallWallJump": {
|
61 |
+
"checkpoints": [
|
62 |
+
{
|
63 |
+
"steps": 3999997,
|
64 |
+
"file_path": "results/walljump_test_02/SmallWallJump/SmallWallJump-3999997.onnx",
|
65 |
+
"reward": 0.9061571420942034,
|
66 |
+
"creation_time": 1693690913.70728,
|
67 |
+
"auxillary_file_paths": [
|
68 |
+
"results/walljump_test_02/SmallWallJump/SmallWallJump-3999997.pt"
|
69 |
+
]
|
70 |
+
},
|
71 |
+
{
|
72 |
+
"steps": 4499998,
|
73 |
+
"file_path": "results/walljump_test_02/SmallWallJump/SmallWallJump-4499998.onnx",
|
74 |
+
"reward": 0.962499999198593,
|
75 |
+
"creation_time": 1693692202.4956467,
|
76 |
+
"auxillary_file_paths": [
|
77 |
+
"results/walljump_test_02/SmallWallJump/SmallWallJump-4499998.pt"
|
78 |
+
]
|
79 |
+
},
|
80 |
+
{
|
81 |
+
"steps": 4999999,
|
82 |
+
"file_path": "results/walljump_test_02/SmallWallJump/SmallWallJump-4999999.onnx",
|
83 |
+
"reward": 0.9641923088293809,
|
84 |
+
"creation_time": 1693693486.5171535,
|
85 |
+
"auxillary_file_paths": [
|
86 |
+
"results/walljump_test_02/SmallWallJump/SmallWallJump-4999999.pt"
|
87 |
+
]
|
88 |
+
},
|
89 |
+
{
|
90 |
+
"steps": 5499990,
|
91 |
+
"file_path": "results/walljump_test_02/SmallWallJump/SmallWallJump-5499990.onnx",
|
92 |
+
"reward": 0.9516337079151407,
|
93 |
+
"creation_time": 1693694711.5314128,
|
94 |
+
"auxillary_file_paths": [
|
95 |
+
"results/walljump_test_02/SmallWallJump/SmallWallJump-5499990.pt"
|
96 |
+
]
|
97 |
+
},
|
98 |
+
{
|
99 |
+
"steps": 5556184,
|
100 |
+
"file_path": "results/walljump_test_02/SmallWallJump/SmallWallJump-5556184.onnx",
|
101 |
+
"reward": 0.9514973373853384,
|
102 |
+
"creation_time": 1693694847.3359807,
|
103 |
+
"auxillary_file_paths": [
|
104 |
+
"results/walljump_test_02/SmallWallJump/SmallWallJump-5556184.pt"
|
105 |
+
]
|
106 |
+
}
|
107 |
+
],
|
108 |
+
"final_checkpoint": {
|
109 |
+
"steps": 5556184,
|
110 |
+
"file_path": "results/walljump_test_02/SmallWallJump.onnx",
|
111 |
+
"reward": 0.9514973373853384,
|
112 |
+
"creation_time": 1693694847.3359807,
|
113 |
+
"auxillary_file_paths": [
|
114 |
+
"results/walljump_test_02/SmallWallJump/SmallWallJump-5556184.pt"
|
115 |
+
]
|
116 |
+
}
|
117 |
+
},
|
118 |
+
"metadata": {
|
119 |
+
"stats_format_version": "0.3.0",
|
120 |
+
"mlagents_version": "0.31.0.dev0",
|
121 |
+
"torch_version": "2.1.0.dev20230902+cu121"
|
122 |
+
}
|
123 |
+
}
|