|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 1.953821063041687, |
|
"min": 1.8360395431518555, |
|
"max": 3.2957701683044434, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 40764.5234375, |
|
"min": 15148.421875, |
|
"max": 150869.625, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 61.9125, |
|
"min": 36.71969696969697, |
|
"max": 999.0, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19812.0, |
|
"min": 16324.0, |
|
"max": 25460.0, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1491.7116693595483, |
|
"min": 1181.2097928802395, |
|
"max": 1509.8147293466548, |
|
"count": 1933 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 238673.86709752772, |
|
"min": 2362.7470600107745, |
|
"max": 390666.0517786308, |
|
"count": 1933 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 19999970.0, |
|
"min": 9748.0, |
|
"max": 19999970.0, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 19999970.0, |
|
"min": 9748.0, |
|
"max": 19999970.0, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.013983321376144886, |
|
"min": -0.11188939958810806, |
|
"max": 0.14131636917591095, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -2.2373313903808594, |
|
"min": -21.442651748657227, |
|
"max": 20.897668838500977, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.013222572393715382, |
|
"min": -0.11129643023014069, |
|
"max": 0.14043569564819336, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -2.1156115531921387, |
|
"min": -21.943002700805664, |
|
"max": 22.116891860961914, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.03847750276327133, |
|
"min": -0.6666666666666666, |
|
"max": 0.4657187480479479, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 6.156400442123413, |
|
"min": -61.22060042619705, |
|
"max": 64.98719954490662, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.03847750276327133, |
|
"min": -0.6666666666666666, |
|
"max": 0.4657187480479479, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 6.156400442123413, |
|
"min": -61.22060042619705, |
|
"max": 64.98719954490662, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 2000 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.010737808815125998, |
|
"min": 0.005027929565403611, |
|
"max": 0.020201207045465706, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.010737808815125998, |
|
"min": 0.005027929565403611, |
|
"max": 0.020201207045465706, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.10132837543884914, |
|
"min": 1.5233589768589204e-06, |
|
"max": 0.13846134146054587, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.10132837543884914, |
|
"min": 1.5233589768589204e-06, |
|
"max": 0.13846134146054587, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.10244849969943365, |
|
"min": 1.6686742810634313e-06, |
|
"max": 0.14102613031864167, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.10244849969943365, |
|
"min": 1.6686742810634313e-06, |
|
"max": 0.14102613031864167, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005, |
|
"min": 0.005, |
|
"max": 0.005, |
|
"count": 960 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005, |
|
"min": 0.005, |
|
"max": 0.005, |
|
"count": 960 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1705757198", |
|
"python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]", |
|
"command_line_arguments": "/opt/conda/bin/mlagents-learn ./../input/soccerfinal/SoccerTwos.yaml --env=./ml-agents/trained-envs-executables/linux/SoccerTwos/SoccerTwos --run-id=Soccer --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.1.2+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1705800035" |
|
}, |
|
"total": 42836.813690111, |
|
"count": 1, |
|
"self": 0.3314620749952155, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.09841409399996337, |
|
"count": 1, |
|
"self": 0.09841409399996337 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 42836.383813942004, |
|
"count": 1, |
|
"self": 31.16820587838447, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 7.336992975992871, |
|
"count": 100, |
|
"self": 7.336992975992871 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 42797.65524656562, |
|
"count": 1361678, |
|
"self": 33.933481584601395, |
|
"children": { |
|
"env_step": { |
|
"total": 31111.48385727351, |
|
"count": 1361678, |
|
"self": 23554.45710108044, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 7536.9110729506265, |
|
"count": 1361678, |
|
"self": 220.90544398053498, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 7316.0056289700915, |
|
"count": 2528490, |
|
"self": 7316.0056289700915 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 20.11568324244331, |
|
"count": 1361678, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 42786.915158091026, |
|
"count": 1361678, |
|
"is_parallel": true, |
|
"self": 23799.42821186385, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.004608822000022883, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0011540760000343653, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0034547459999885177, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0034547459999885177 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.03137612699993042, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0007355089998100084, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0006529350000619161, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006529350000619161 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.027124995999997736, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.027124995999997736 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0028626870000607596, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0005997199998546421, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0022629670002061175, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0022629670002061175 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 18987.215949916157, |
|
"count": 1361677, |
|
"is_parallel": true, |
|
"self": 999.5017485719763, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 825.9811654139888, |
|
"count": 1361677, |
|
"is_parallel": true, |
|
"self": 825.9811654139888 |
|
}, |
|
"communicator.exchange": { |
|
"total": 13345.161397115104, |
|
"count": 1361677, |
|
"is_parallel": true, |
|
"self": 13345.161397115104 |
|
}, |
|
"steps_from_proto": { |
|
"total": 3816.571638815089, |
|
"count": 2723354, |
|
"is_parallel": true, |
|
"self": 649.0959179964229, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 3167.475720818666, |
|
"count": 10893416, |
|
"is_parallel": true, |
|
"self": 3167.475720818666 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.2709963110160061, |
|
"count": 198, |
|
"is_parallel": true, |
|
"self": 0.04728555095698539, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.22371076005902069, |
|
"count": 792, |
|
"is_parallel": true, |
|
"self": 0.22371076005902069 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 11652.23790770751, |
|
"count": 1361678, |
|
"self": 249.20661963368548, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 4198.827744278771, |
|
"count": 1361678, |
|
"self": 4190.660633005776, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 8.167111272995271, |
|
"count": 40, |
|
"self": 8.167111272995271 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 7204.203543795053, |
|
"count": 960, |
|
"self": 5050.691455942814, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 2153.5120878522384, |
|
"count": 14400, |
|
"self": 2153.5120878522384 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.7510028555989265e-06, |
|
"count": 1, |
|
"self": 1.7510028555989265e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.2233667710024747, |
|
"count": 1, |
|
"self": 0.001880750001873821, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.22148602100060089, |
|
"count": 1, |
|
"self": 0.22148602100060089 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |