|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.3555440604686737, |
|
"min": 0.3444250524044037, |
|
"max": 1.4453279972076416, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 10654.9443359375, |
|
"min": 10277.6435546875, |
|
"max": 43845.46875, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989936.0, |
|
"min": 29884.0, |
|
"max": 989936.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989936.0, |
|
"min": 29884.0, |
|
"max": 989936.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.7168408632278442, |
|
"min": -0.11632892489433289, |
|
"max": 0.7337176203727722, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 207.88385009765625, |
|
"min": -28.03527069091797, |
|
"max": 220.8489990234375, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": -0.005016577895730734, |
|
"min": -0.01984540745615959, |
|
"max": 0.32494187355041504, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": -1.4548076391220093, |
|
"min": -5.556714057922363, |
|
"max": 78.31098937988281, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06983554277255842, |
|
"min": 0.065082382624906, |
|
"max": 0.07398626746989136, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.977697598815818, |
|
"min": 0.5689214679210824, |
|
"max": 1.0662160731250576, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.016041410039179024, |
|
"min": 0.0008615226076904601, |
|
"max": 0.01746883107512649, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.22457974054850635, |
|
"min": 0.010338271292285522, |
|
"max": 0.2555410061171392, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.440461805592858e-06, |
|
"min": 7.440461805592858e-06, |
|
"max": 0.0002947688642437125, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010416646527830001, |
|
"min": 0.00010416646527830001, |
|
"max": 0.0036327196890934997, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10248012142857144, |
|
"min": 0.10248012142857144, |
|
"max": 0.1982562875, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4347217, |
|
"min": 1.4347217, |
|
"max": 2.6109065000000005, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00025776413071428576, |
|
"min": 0.00025776413071428576, |
|
"max": 0.00982580312125, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0036086978300000007, |
|
"min": 0.0036086978300000007, |
|
"max": 0.12110955934999999, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.01404791884124279, |
|
"min": 0.01404791884124279, |
|
"max": 0.4897589087486267, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.19667086005210876, |
|
"min": 0.19667086005210876, |
|
"max": 3.9180712699890137, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 269.01801801801804, |
|
"min": 242.60162601626016, |
|
"max": 992.516129032258, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29861.0, |
|
"min": 17450.0, |
|
"max": 32821.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.7129603390758101, |
|
"min": -0.928929082808956, |
|
"max": 1.757398356388255, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 190.13859763741493, |
|
"min": -28.796801567077637, |
|
"max": 216.15999783575535, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.7129603390758101, |
|
"min": -0.928929082808956, |
|
"max": 1.757398356388255, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 190.13859763741493, |
|
"min": -28.796801567077637, |
|
"max": 216.15999783575535, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.03898474175851637, |
|
"min": 0.03579492737054995, |
|
"max": 9.307819741260674, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 4.327306335195317, |
|
"min": 4.327306335195317, |
|
"max": 167.54075534269214, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1734224061", |
|
"python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "1.2.0.dev0", |
|
"mlagents_envs_version": "1.2.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.5.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1734227796" |
|
}, |
|
"total": 3734.4861459480003, |
|
"count": 1, |
|
"self": 0.7442452810005307, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.08567339599994739, |
|
"count": 1, |
|
"self": 0.08567339599994739 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 3733.656227271, |
|
"count": 1, |
|
"self": 2.3258756500417803, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 7.149475273000007, |
|
"count": 1, |
|
"self": 7.149475273000007 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 3724.0844160139573, |
|
"count": 64287, |
|
"self": 2.4799703210978805, |
|
"children": { |
|
"env_step": { |
|
"total": 2572.8057086688705, |
|
"count": 64287, |
|
"self": 2407.55905183686, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 163.74231810997117, |
|
"count": 64287, |
|
"self": 6.985091713972679, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 156.7572263959985, |
|
"count": 62554, |
|
"self": 156.7572263959985 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 1.5043387220396198, |
|
"count": 64287, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 3726.181707121919, |
|
"count": 64287, |
|
"is_parallel": true, |
|
"self": 1505.5052545249223, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0036498389999906067, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0012262340000006589, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.002423604999989948, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.002423604999989948 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.06984606499997881, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000907689999962713, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.000636894999956894, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000636894999956894 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.06602473700002065, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.06602473700002065 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0022767430000385502, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004938820000006672, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001782861000037883, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001782861000037883 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 2220.6764525969966, |
|
"count": 64286, |
|
"is_parallel": true, |
|
"self": 57.17260016098953, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 34.92766388501718, |
|
"count": 64286, |
|
"is_parallel": true, |
|
"self": 34.92766388501718 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1983.0383064869516, |
|
"count": 64286, |
|
"is_parallel": true, |
|
"self": 1983.0383064869516 |
|
}, |
|
"steps_from_proto": { |
|
"total": 145.53788206403817, |
|
"count": 64286, |
|
"is_parallel": true, |
|
"self": 30.411831057882637, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 115.12605100615554, |
|
"count": 514288, |
|
"is_parallel": true, |
|
"self": 115.12605100615554 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1148.7987370239891, |
|
"count": 64287, |
|
"self": 4.068511527960027, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 175.85607037002603, |
|
"count": 64287, |
|
"self": 175.52063816502562, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.3354322050004157, |
|
"count": 2, |
|
"self": 0.3354322050004157 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 968.874155126003, |
|
"count": 459, |
|
"self": 402.23629688097026, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 566.6378582450327, |
|
"count": 22806, |
|
"self": 566.6378582450327 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 2.016000507865101e-06, |
|
"count": 1, |
|
"self": 2.016000507865101e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.09645831800025917, |
|
"count": 1, |
|
"self": 0.002015907999521005, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.09444241000073816, |
|
"count": 1, |
|
"self": 0.09444241000073816 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |