|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 3.1518149375915527, |
|
"min": 3.1280832290649414, |
|
"max": 3.295764923095703, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 62532.0078125, |
|
"min": 7487.9755859375, |
|
"max": 108962.4609375, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 394.38461538461536, |
|
"min": 333.64285714285717, |
|
"max": 999.0, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 20508.0, |
|
"min": 13232.0, |
|
"max": 27188.0, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1217.783430049334, |
|
"min": 1198.6947420967692, |
|
"max": 1219.1502834155515, |
|
"count": 49 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 26791.235461085344, |
|
"min": 2399.6648813132306, |
|
"max": 31659.675669988363, |
|
"count": 49 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 499342.0, |
|
"min": 9610.0, |
|
"max": 499342.0, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 499342.0, |
|
"min": 9610.0, |
|
"max": 499342.0, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.001771173789165914, |
|
"min": -0.0587509423494339, |
|
"max": 0.008092700503766537, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 0.04605051875114441, |
|
"min": -1.3193058967590332, |
|
"max": 0.16994671523571014, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.0030848283786326647, |
|
"min": -0.05528537184000015, |
|
"max": 0.011168592609465122, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -0.080205537378788, |
|
"min": -1.1658110618591309, |
|
"max": 0.23374596238136292, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.14319230730716997, |
|
"min": -0.6622699990868568, |
|
"max": 0.38508888747957015, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -3.7229999899864197, |
|
"min": -13.270399957895279, |
|
"max": 6.931599974632263, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.14319230730716997, |
|
"min": -0.6622699990868568, |
|
"max": 0.38508888747957015, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -3.7229999899864197, |
|
"min": -13.270399957895279, |
|
"max": 6.931599974632263, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 50 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.019773958838777618, |
|
"min": 0.014282445534384654, |
|
"max": 0.021488917719883222, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.019773958838777618, |
|
"min": 0.014282445534384654, |
|
"max": 0.021488917719883222, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.0035961836498851576, |
|
"min": 0.00197239763136687, |
|
"max": 0.010879720995823542, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.0035961836498851576, |
|
"min": 0.00197239763136687, |
|
"max": 0.010879720995823542, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.0038008132095759114, |
|
"min": 0.0018043413251039705, |
|
"max": 0.011257337064792712, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.0038008132095759114, |
|
"min": 0.0018043413251039705, |
|
"max": 0.011257337064792712, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.19999999999999996, |
|
"max": 0.20000000000000007, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.19999999999999996, |
|
"max": 0.20000000000000007, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005, |
|
"max": 0.005000000000000001, |
|
"count": 22 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005, |
|
"max": 0.005000000000000001, |
|
"count": 22 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1679237840", |
|
"python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-env-executables/linux/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1679238979" |
|
}, |
|
"total": 1139.19451972, |
|
"count": 1, |
|
"self": 0.4422080589997677, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.10711526600016441, |
|
"count": 1, |
|
"self": 0.10711526600016441 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 1138.645196395, |
|
"count": 1, |
|
"self": 0.9060929790161936, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 10.464037975999872, |
|
"count": 3, |
|
"self": 10.464037975999872 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 1127.0194457709838, |
|
"count": 32372, |
|
"self": 1.0659959959739354, |
|
"children": { |
|
"env_step": { |
|
"total": 920.126967747969, |
|
"count": 32372, |
|
"self": 724.232329287993, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 195.33478310100145, |
|
"count": 32372, |
|
"self": 6.310763247022123, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 189.02401985397933, |
|
"count": 64076, |
|
"self": 189.02401985397933 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.5598553589745734, |
|
"count": 32372, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1135.4949169180063, |
|
"count": 32372, |
|
"is_parallel": true, |
|
"self": 528.9950504610001, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.006792135999830862, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.004350616000010632, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0024415199998202297, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0024415199998202297 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.06933690400001069, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0009805639997466642, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0007959760000630922, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0007959760000630922 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.06406958000002305, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.06406958000002305 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0034907840001778823, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.000761014000090654, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0027297700000872283, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0027297700000872283 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 606.4953913580061, |
|
"count": 32371, |
|
"is_parallel": true, |
|
"self": 33.801688653018346, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 25.64243305999662, |
|
"count": 32371, |
|
"is_parallel": true, |
|
"self": 25.64243305999662 |
|
}, |
|
"communicator.exchange": { |
|
"total": 437.3293248820107, |
|
"count": 32371, |
|
"is_parallel": true, |
|
"self": 437.3293248820107 |
|
}, |
|
"steps_from_proto": { |
|
"total": 109.72194476298046, |
|
"count": 64742, |
|
"is_parallel": true, |
|
"self": 20.71364357187258, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 89.00830119110788, |
|
"count": 258968, |
|
"is_parallel": true, |
|
"self": 89.00830119110788 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.004475099000046612, |
|
"count": 4, |
|
"is_parallel": true, |
|
"self": 0.000881249999110878, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.003593849000935734, |
|
"count": 16, |
|
"is_parallel": true, |
|
"self": 0.003593849000935734 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 205.8264820270408, |
|
"count": 32372, |
|
"self": 7.714931302054993, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 57.23321689998488, |
|
"count": 32372, |
|
"self": 56.99616937798487, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.23704752200001167, |
|
"count": 1, |
|
"self": 0.23704752200001167 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 140.87833382500094, |
|
"count": 22, |
|
"self": 87.20122397999853, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 53.677109845002406, |
|
"count": 672, |
|
"self": 53.677109845002406 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.0140001904801466e-06, |
|
"count": 1, |
|
"self": 1.0140001904801466e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.2556186550000348, |
|
"count": 1, |
|
"self": 0.001857178999671305, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.2537614760003635, |
|
"count": 1, |
|
"self": 0.2537614760003635 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |