haolx committed on Jan 30, 2024

Commit

68f0c90

verified ·

1 Parent(s): 142a82f

First Push

Browse files

Files changed (21) hide show

SnowballTarget.onnx +2 -2
SnowballTarget/SnowballTarget-200112.onnx +2 -2
SnowballTarget/SnowballTarget-200112.pt +2 -2
SnowballTarget/SnowballTarget-249984.onnx +3 -0
SnowballTarget/SnowballTarget-249984.pt +3 -0
SnowballTarget/SnowballTarget-299944.onnx +3 -0
SnowballTarget/SnowballTarget-299944.pt +3 -0
SnowballTarget/SnowballTarget-349968.onnx +3 -0
SnowballTarget/SnowballTarget-349968.pt +3 -0
SnowballTarget/SnowballTarget-399968.onnx +3 -0
SnowballTarget/SnowballTarget-399968.pt +3 -0
SnowballTarget/SnowballTarget-400224.onnx +3 -0
SnowballTarget/SnowballTarget-400224.pt +3 -0
SnowballTarget/checkpoint.pt +2 -2
SnowballTarget/events.out.tfevents.1706586587.64f70067c60d.6658.0 +3 -0
SnowballTarget/events.out.tfevents.1706586651.64f70067c60d.6984.0 +3 -0
config.json +1 -1
configuration.yaml +3 -3
run_logs/Player-0.log +5 -8
run_logs/timers.json +135 -135
run_logs/training_status.json +58 -13

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aea0441032f0bbd0baaf11a4ca41429a93264db22dd40b1b685f4ca27f2ce8a0
-size 650646

 version https://git-lfs.github.com/spec/v1
+oid sha256:7de8e61718c0d3b83cd0bd296f1e9ed631cd2296a23843e60d8b03b8d3cef4d9
+size 1178864

SnowballTarget/SnowballTarget-200112.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aea0441032f0bbd0baaf11a4ca41429a93264db22dd40b1b685f4ca27f2ce8a0
-size 650646

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e55ecbef98674628f2cbb3468df640ed49c1e7fea012c74fbf1d9067c36af96
+size 1177899

SnowballTarget/SnowballTarget-200112.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e60f12a2417ca8ca54268ff04dd683d18401d7fd3a5a08bcb42cbcd238816dcc
-size 3850075

 version https://git-lfs.github.com/spec/v1
+oid sha256:9dca1a50bc723fcbdf15080845d455a677a02934fc9e18be24974a71d83873f6
+size 2342243

SnowballTarget/SnowballTarget-249984.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7dde4581d9b88a82ece2438d9b3c0a9329120a24fc38de85e992eb06ff0fad7
+size 1178864

SnowballTarget/SnowballTarget-249984.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6638b2e4283e7ae9e64f5a1662cb85cec9814c652a718b6cc1b86d5a6fbe5be1
+size 7018622

SnowballTarget/SnowballTarget-299944.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:71d12875e92651c02e3e847b0dbf42d879c500d61bb3022314925ba84a742e91
+size 1178864

SnowballTarget/SnowballTarget-299944.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb2e799d258c8d73a6219e105f5196d97c1679e556f49dd549d7110a8e79286e
+size 7018622

SnowballTarget/SnowballTarget-349968.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:340c5a6e9ebd7a8c7f235df4ef6e41c98e01bd4e88d65864e91bf72366a5fdcc
+size 1178864

SnowballTarget/SnowballTarget-349968.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c8fc4fe71537b69da9e0203d58c388d101dc73f7dec45434cbb41ffe972bb96f
+size 7018622

SnowballTarget/SnowballTarget-399968.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7de8e61718c0d3b83cd0bd296f1e9ed631cd2296a23843e60d8b03b8d3cef4d9
+size 1178864

SnowballTarget/SnowballTarget-399968.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a0fdd5ebf8c3cc8f31b32307cdffbcd8226893e4c8ff15baca2fef57e38b8bd8
+size 7018622

SnowballTarget/SnowballTarget-400224.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7de8e61718c0d3b83cd0bd296f1e9ed631cd2296a23843e60d8b03b8d3cef4d9
+size 1178864

SnowballTarget/SnowballTarget-400224.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:669d417c3b0e9b179ff392ce8d7b74a88856fa664896b21352e57cce9e7e37cd
+size 7018622

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5cee364ef680cc084f26dad581ab9761f19748bcce33e79a656aaac58ac3eee7
-size 3849250

 version https://git-lfs.github.com/spec/v1
+oid sha256:64d85691043578f273f492e7a535a37b1391a15d7b9e836df1863ce13b7bae5f
+size 7017445

SnowballTarget/events.out.tfevents.1706586587.64f70067c60d.6658.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05cd256de86814088408d0599f04266b38513f6f2f790961de63865ba8681816
+size 1114

SnowballTarget/events.out.tfevents.1706586651.64f70067c60d.6984.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3c66f69d8d5be37e2328ab5a9e2c042c3a0a4744cd4b9ae192bf8c079eab1de0
+size 23247

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 4, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 400000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -18,7 +18,7 @@ behaviors:
     network_settings:
       normalize: false
       hidden_units: 256
-      num_layers: 2
       vis_encode_type: simple
       memory: null
       goal_conditioning_type: hyper
@@ -38,7 +38,7 @@ behaviors:
     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
-    max_steps: 200000
     time_horizon: 64
     summary_freq: 10000
     threaded: true
@@ -69,7 +69,7 @@ checkpoint_settings:
   run_id: SnowballTarget1
   initialize_from: null
   load_model: false
-  resume: false
   force: false
   train_model: false
   inference: false

     network_settings:
       normalize: false
       hidden_units: 256
+      num_layers: 4
       vis_encode_type: simple
       memory: null
       goal_conditioning_type: hyper
     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
+    max_steps: 400000
     time_horizon: 64
     summary_freq: 10000
     threaded: true
   run_id: SnowballTarget1
   initialize_from: null
   load_model: false
+  resume: true
   force: false
   train_model: false
   inference: false

run_logs/Player-0.log CHANGED Viewed

@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarge
 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
-Unable to load player prefs
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.101 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.894757 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -178,13 +175,13 @@ Memory Statistics:
       Peak usage frame count: [4.0 MB-8.0 MB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 6.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
       Peak usage frame count: [16.0 MB-32.0 MB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 17.9 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -213,7 +210,7 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5253 frames, [64.0 KB-128.0 KB]: 207 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 66.0 KB

 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.093 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.841640 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
       Peak usage frame count: [4.0 MB-8.0 MB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 6.7 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
       Peak usage frame count: [16.0 MB-32.0 MB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 17.8 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5257 frames, [64.0 KB-128.0 KB]: 203 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 66.0 KB

run_logs/timers.json CHANGED Viewed

@@ -2,39 +2,39 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 0.9640917181968689,
-            "min": 0.9640917181968689,
-            "max": 2.875121831893921,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 9194.54296875,
-            "min": 9194.54296875,
-            "max": 29475.748046875,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
             "count": 20
         },
         "SnowballTarget.Step.sum": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 13.0621919631958,
-            "min": 0.2580852210521698,
-            "max": 13.0621919631958,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2547.12744140625,
-            "min": 50.06853485107422,
-            "max": 2632.72509765625,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
@@ -50,87 +50,87 @@
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.07620219156310401,
-            "min": 0.058910317715772716,
-            "max": 0.07620219156310401,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.30480876625241604,
-            "min": 0.23564127086309086,
-            "max": 0.36918028767047195,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.1935376073507702,
-            "min": 0.10430312625762514,
-            "max": 0.30434047576843526,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.7741504294030808,
-            "min": 0.41721250503050056,
-            "max": 1.5160913888145895,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 8.082097306000005e-06,
-            "min": 8.082097306000005e-06,
-            "max": 0.000291882002706,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 3.232838922400002e-05,
-            "min": 3.232838922400002e-05,
-            "max": 0.00138516003828,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.10269400000000001,
-            "min": 0.10269400000000001,
-            "max": 0.19729400000000002,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.41077600000000003,
-            "min": 0.41077600000000003,
-            "max": 0.96172,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
-            "value": 0.0001444306000000001,
-            "min": 0.0001444306000000001,
-            "max": 0.0048649706,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
-            "value": 0.0005777224000000004,
-            "min": 0.0005777224000000004,
-            "max": 0.023089828,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 25.454545454545453,
-            "min": 3.022727272727273,
-            "max": 25.78181818181818,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1120.0,
-            "min": 133.0,
-            "max": 1418.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 25.454545454545453,
-            "min": 3.022727272727273,
-            "max": 25.78181818181818,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 1120.0,
-            "min": 133.0,
-            "max": 1418.0,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
@@ -148,67 +148,67 @@
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1706585821",
         "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "1.1.0.dev0",
         "mlagents_envs_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.1.2+cu121",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1706586320"
     },
-    "total": 498.938967403,
     "count": 1,
-    "self": 0.5930980260000069,
     "children": {
         "run_training.setup": {
-            "total": 0.06141591299990523,
             "count": 1,
-            "self": 0.06141591299990523
         },
         "TrainerController.start_learning": {
-            "total": 498.2844534640001,
             "count": 1,
-            "self": 0.7128704429934487,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 3.9214750250000634,
                     "count": 1,
-                    "self": 3.9214750250000634
                 },
                 "TrainerController.advance": {
-                    "total": 493.55023995700674,
-                    "count": 18198,
-                    "self": 0.3701143110024532,
                     "children": {
                         "env_step": {
-                            "total": 493.1801256460043,
-                            "count": 18198,
-                            "self": 326.14169851899044,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 166.69239135500163,
-                                    "count": 18198,
-                                    "self": 1.6520208929865703,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 165.04037046201506,
-                                            "count": 18198,
-                                            "self": 165.04037046201506
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.3460357720122147,
-                                    "count": 18198,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 496.8587532680011,
-                                            "count": 18198,
                                             "is_parallel": true,
-                                            "self": 242.92099891199825,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.005800985000064429,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.003589930000202912,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.002211054999861517,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.002211054999861517
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.04478171999994629,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0007815909998498682,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.0005036119999886068,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0005036119999886068
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.041240630000061174,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.041240630000061174
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.0022558870000466413,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0004436040003383823,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.001812282999708259,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.001812282999708259
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 253.93775435600287,
-                                                    "count": 18197,
                                                     "is_parallel": true,
-                                                    "self": 11.717513592010505,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 5.80607967000708,
-                                                            "count": 18197,
                                                             "is_parallel": true,
-                                                            "self": 5.80607967000708
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 199.6506076370058,
-                                                            "count": 18197,
                                                             "is_parallel": true,
-                                                            "self": 199.6506076370058
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 36.76355345697948,
-                                                            "count": 18197,
                                                             "is_parallel": true,
-                                                            "self": 7.211129860025494,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 29.552423596953986,
-                                                                    "count": 181970,
                                                                     "is_parallel": true,
-                                                                    "self": 29.552423596953986
                                                                 }
                                                             }
                                                         }
@@ -309,9 +309,9 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 4.622200003723265e-05,
                     "count": 1,
-                    "self": 4.622200003723265e-05,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
@@ -320,36 +320,36 @@
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
-                                    "total": 487.30327751295226,
-                                    "count": 745202,
                                     "is_parallel": true,
-                                    "self": 16.026501295877665,
                                     "children": {
                                         "process_trajectory": {
-                                            "total": 269.20563459607524,
-                                            "count": 745202,
                                             "is_parallel": true,
-                                            "self": 268.6841391000754,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
-                                                    "total": 0.5214954959998295,
                                                     "count": 4,
                                                     "is_parallel": true,
-                                                    "self": 0.5214954959998295
                                                 }
                                             }
                                         },
                                         "_update_policy": {
-                                            "total": 202.07114162099936,
                                             "count": 90,
                                             "is_parallel": true,
-                                            "self": 61.49067776899642,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
-                                                    "total": 140.58046385200294,
                                                     "count": 4587,
                                                     "is_parallel": true,
-                                                    "self": 140.58046385200294
                                                 }
                                             }
                                         }
@@ -360,14 +360,14 @@
                     }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.09982181699979265,
                     "count": 1,
-                    "self": 0.0011567599997306388,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.098665057000062,
                             "count": 1,
-                            "self": 0.098665057000062
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 0.8955487012863159,
+            "min": 0.8948118686676025,
+            "max": 2.853564739227295,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 9053.1015625,
+            "min": 8701.150390625,
+            "max": 29223.357421875,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
+            "value": 399968.0,
+            "min": 209936.0,
+            "max": 399968.0,
             "count": 20
         },
         "SnowballTarget.Step.sum": {
+            "value": 399968.0,
+            "min": 209936.0,
+            "max": 399968.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 13.22802734375,
+            "min": 0.2574637532234192,
+            "max": 13.2938232421875,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 2579.46533203125,
+            "min": 49.433040618896484,
+            "max": 2711.93994140625,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.07011461774013963,
+            "min": 0.06358130356124556,
+            "max": 0.07595940214380914,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.28045847096055854,
+            "min": 0.2543252142449822,
+            "max": 0.3797970107190457,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.21542924686389808,
+            "min": 0.1385706035470517,
+            "max": 0.30058827799032717,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.8617169874555923,
+            "min": 0.5542824141882068,
+            "max": 1.391813202231538,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 3.957098681000002e-06,
+            "min": 3.957098681000002e-06,
+            "max": 0.000145857051381,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 1.582839472400001e-05,
+            "min": 1.582839472400001e-05,
+            "max": 0.00069216026928,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.101319,
+            "min": 0.101319,
+            "max": 0.14861900000000003,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.405276,
+            "min": 0.405276,
+            "max": 0.73072,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
+            "value": 7.581810000000006e-05,
+            "min": 7.581810000000006e-05,
+            "max": 0.0024360881000000003,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
+            "value": 0.00030327240000000024,
+            "min": 0.00030327240000000024,
+            "max": 0.011562928000000002,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 25.704545454545453,
+            "min": 3.6363636363636362,
+            "max": 25.98181818181818,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1131.0,
+            "min": 160.0,
+            "max": 1429.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 25.704545454545453,
+            "min": 3.6363636363636362,
+            "max": 25.98181818181818,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 1131.0,
+            "min": 160.0,
+            "max": 1429.0,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1706586650",
         "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --resume",
         "mlagents_version": "1.1.0.dev0",
         "mlagents_envs_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.1.2+cu121",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1706587162"
     },
+    "total": 512.0949007670001,
     "count": 1,
+    "self": 0.47622578300024543,
     "children": {
         "run_training.setup": {
+            "total": 0.0539380440000059,
             "count": 1,
+            "self": 0.0539380440000059
         },
         "TrainerController.start_learning": {
+            "total": 511.5647369399999,
             "count": 1,
+            "self": 0.7514956730024096,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 2.3224954419999904,
                     "count": 1,
+                    "self": 2.3224954419999904
                 },
                 "TrainerController.advance": {
+                    "total": 508.35818274799726,
+                    "count": 18199,
+                    "self": 0.35644740900397665,
                     "children": {
                         "env_step": {
+                            "total": 508.0017353389933,
+                            "count": 18199,
+                            "self": 331.5146749430048,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 176.1266867020031,
+                                    "count": 18199,
+                                    "self": 1.6763091989912482,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 174.45037750301185,
+                                            "count": 18199,
+                                            "self": 174.45037750301185
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.3603736939853661,
+                                    "count": 18199,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 509.99262467098515,
+                                            "count": 18199,
                                             "is_parallel": true,
+                                            "self": 255.9905113189609,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.00214061299993773,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0006248759998470632,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0015157370000906667,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0015157370000906667
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.03927482999984022,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.000713487999746576,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.00043658399999912945,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.00043658399999912945
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.03600957499998003,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.03600957499998003
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0021151830001144845,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.00043435500015220896,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0016808279999622755,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0016808279999622755
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 254.00211335202425,
+                                                    "count": 18198,
                                                     "is_parallel": true,
+                                                    "self": 11.615472576003185,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 5.810355305988878,
+                                                            "count": 18198,
                                                             "is_parallel": true,
+                                                            "self": 5.810355305988878
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 199.92710642801785,
+                                                            "count": 18198,
                                                             "is_parallel": true,
+                                                            "self": 199.92710642801785
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 36.64917904201434,
+                                                            "count": 18198,
                                                             "is_parallel": true,
+                                                            "self": 7.209387495973033,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 29.439791546041306,
+                                                                    "count": 181980,
                                                                     "is_parallel": true,
+                                                                    "self": 29.439791546041306
                                                                 }
                                                             }
                                                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 0.0002489560001777136,
                     "count": 1,
+                    "self": 0.0002489560001777136,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
+                                    "total": 502.01383666296533,
+                                    "count": 762377,
                                     "is_parallel": true,
+                                    "self": 16.35181663889466,
                                     "children": {
                                         "process_trajectory": {
+                                            "total": 274.5566146790702,
+                                            "count": 762377,
                                             "is_parallel": true,
+                                            "self": 273.66009452307003,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
+                                                    "total": 0.8965201560001788,
                                                     "count": 4,
                                                     "is_parallel": true,
+                                                    "self": 0.8965201560001788
                                                 }
                                             }
                                         },
                                         "_update_policy": {
+                                            "total": 211.10540534500046,
                                             "count": 90,
                                             "is_parallel": true,
+                                            "self": 60.61084359299434,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
+                                                    "total": 150.49456175200612,
                                                     "count": 4587,
                                                     "is_parallel": true,
+                                                    "self": 150.49456175200612
                                                 }
                                             }
                                         }
                     }
                 },
                 "TrainerController._save_models": {
+                    "total": 0.1323141210000358,
                     "count": 1,
+                    "self": 0.002316863000032754,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.12999725800000306,
                             "count": 1,
+                            "self": 0.12999725800000306
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -1,15 +1,6 @@
 {
     "SnowballTarget": {
         "checkpoints": [
-            {
-                "steps": 49936,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
-                "reward": 15.181818181818182,
-                "creation_time": 1706585952.6417303,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
-                ]
-            },
             {
                 "steps": 99960,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
@@ -45,15 +36,69 @@
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 200112,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 24.90909090909091,
-            "creation_time": 1706586320.2787673,
             "auxillary_file_paths": [
-                "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
             ]
         }
     },

 {
     "SnowballTarget": {
         "checkpoints": [
             {
                 "steps": 99960,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
+            },
+            {
+                "steps": 200112,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
+                "reward": null,
+                "creation_time": 1706586589.852068,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
+                ]
+            },
+            {
+                "steps": 249984,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-249984.onnx",
+                "reward": 18.636363636363637,
+                "creation_time": 1706586782.2838278,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-249984.pt"
+                ]
+            },
+            {
+                "steps": 299944,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-299944.onnx",
+                "reward": 25.363636363636363,
+                "creation_time": 1706586910.081696,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-299944.pt"
+                ]
+            },
+            {
+                "steps": 349968,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-349968.onnx",
+                "reward": 26.0,
+                "creation_time": 1706587036.3253357,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-349968.pt"
+                ]
+            },
+            {
+                "steps": 399968,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-399968.onnx",
+                "reward": 25.272727272727273,
+                "creation_time": 1706587161.87238,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-399968.pt"
+                ]
+            },
+            {
+                "steps": 400224,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-400224.onnx",
+                "reward": 25.272727272727273,
+                "creation_time": 1706587162.0471206,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-400224.pt"
+                ]
             }
         ],
         "final_checkpoint": {
+            "steps": 400224,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
+            "reward": 25.272727272727273,
+            "creation_time": 1706587162.0471206,
             "auxillary_file_paths": [
+                "results/SnowballTarget1/SnowballTarget/SnowballTarget-400224.pt"
             ]
         }
     },