|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 1.5668424367904663, |
|
"min": 1.5011452436447144, |
|
"max": 3.2958030700683594, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 31437.126953125, |
|
"min": 20539.86328125, |
|
"max": 139477.171875, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 49.535353535353536, |
|
"min": 37.40769230769231, |
|
"max": 999.0, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19616.0, |
|
"min": 13784.0, |
|
"max": 30080.0, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1613.1626451644208, |
|
"min": 1182.5759922505104, |
|
"max": 1693.1391499720842, |
|
"count": 1461 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 319406.20374255534, |
|
"min": 2366.6584398141267, |
|
"max": 418503.31246517465, |
|
"count": 1461 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 14999991.0, |
|
"min": 9056.0, |
|
"max": 14999991.0, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 14999991.0, |
|
"min": 9056.0, |
|
"max": 14999991.0, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.042363736778497696, |
|
"min": -0.12342528253793716, |
|
"max": 0.21824456751346588, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -8.388019561767578, |
|
"min": -23.450803756713867, |
|
"max": 29.76882553100586, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.04421196132898331, |
|
"min": -0.12307731062173843, |
|
"max": 0.21696819365024567, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -8.753968238830566, |
|
"min": -23.384689331054688, |
|
"max": 30.355152130126953, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.03473737534850535, |
|
"min": -0.5714285714285714, |
|
"max": 0.5861288127252611, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -6.878000319004059, |
|
"min": -59.04639995098114, |
|
"max": 55.0628000497818, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.03473737534850535, |
|
"min": -0.5714285714285714, |
|
"max": 0.5861288127252611, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -6.878000319004059, |
|
"min": -59.04639995098114, |
|
"max": 55.0628000497818, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 1500 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.01692735132625482, |
|
"min": 0.008673173755717774, |
|
"max": 0.02537493456620723, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.01692735132625482, |
|
"min": 0.008673173755717774, |
|
"max": 0.02537493456620723, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.1095173495511214, |
|
"min": 2.8146574327555147e-07, |
|
"max": 0.13110793729623157, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.1095173495511214, |
|
"min": 2.8146574327555147e-07, |
|
"max": 0.13110793729623157, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.11108667875329653, |
|
"min": 2.4219187485149024e-07, |
|
"max": 0.1342211882273356, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.11108667875329653, |
|
"min": 2.4219187485149024e-07, |
|
"max": 0.1342211882273356, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.00019999999999999996, |
|
"min": 0.00019999999999999996, |
|
"max": 0.00019999999999999996, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.00019999999999999996, |
|
"min": 0.00019999999999999996, |
|
"max": 0.00019999999999999996, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 724 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 724 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1719349536", |
|
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
|
"command_line_arguments": "/home/pandita/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id==SoccerTwosTrial --force --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.3.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1719366982" |
|
}, |
|
"total": 17446.608223610998, |
|
"count": 1, |
|
"self": 0.21834589999707532, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.010502066998014925, |
|
"count": 1, |
|
"self": 0.010502066998014925 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 17446.379375644003, |
|
"count": 1, |
|
"self": 17.780386075039132, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.5676018060075876, |
|
"count": 75, |
|
"self": 2.5676018060075876 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 17425.867149970956, |
|
"count": 1035080, |
|
"self": 17.467622792311886, |
|
"children": { |
|
"env_step": { |
|
"total": 12158.26244885652, |
|
"count": 1035080, |
|
"self": 8894.618521874247, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 3252.2571331651343, |
|
"count": 1035080, |
|
"self": 100.05797721151976, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 3152.1991559536145, |
|
"count": 1889688, |
|
"self": 3152.1991559536145 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 11.386793817138823, |
|
"count": 1035080, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 17420.066335439395, |
|
"count": 1035080, |
|
"is_parallel": true, |
|
"self": 10324.29204544552, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.001568653002323117, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0004486799989535939, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011199730033695232, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011199730033695232 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.015322688002925133, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00035246599873062223, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00030690499988850206, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00030690499988850206 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.013634989001729991, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.013634989001729991 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0010283280025760178, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.00023674400654272176, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.000791583996033296, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.000791583996033296 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 7095.698627933849, |
|
"count": 1035079, |
|
"is_parallel": true, |
|
"self": 361.7603478302808, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 274.0821232143244, |
|
"count": 1035079, |
|
"is_parallel": true, |
|
"self": 274.0821232143244 |
|
}, |
|
"communicator.exchange": { |
|
"total": 5442.701532716714, |
|
"count": 1035079, |
|
"is_parallel": true, |
|
"self": 5442.701532716714 |
|
}, |
|
"steps_from_proto": { |
|
"total": 1017.15462417253, |
|
"count": 2070158, |
|
"is_parallel": true, |
|
"self": 200.8899587075939, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 816.2646654649361, |
|
"count": 8280632, |
|
"is_parallel": true, |
|
"self": 816.2646654649361 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0756620600259339, |
|
"count": 148, |
|
"is_parallel": true, |
|
"self": 0.014940235047106398, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0607218249788275, |
|
"count": 592, |
|
"is_parallel": true, |
|
"self": 0.0607218249788275 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 5250.137078322125, |
|
"count": 1035080, |
|
"self": 137.34018241210288, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 1789.6481766791367, |
|
"count": 1035080, |
|
"self": 1784.776113835127, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 4.872062844009633, |
|
"count": 30, |
|
"self": 4.872062844009633 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 3323.148719230885, |
|
"count": 724, |
|
"self": 1161.5716940290258, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 2161.577025201859, |
|
"count": 21720, |
|
"self": 2161.577025201859 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 7.019989425316453e-07, |
|
"count": 1, |
|
"self": 7.019989425316453e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.16423709000082454, |
|
"count": 1, |
|
"self": 0.0019961860016337596, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.16224090399919078, |
|
"count": 1, |
|
"self": 0.16224090399919078 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |