poca-SoccerTwos / run_logs /timers.json
caiiofc's picture
First Push
8eeb81a verified
raw
history blame contribute delete
No virus
15.6 kB
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 2.3299667835235596,
"min": 2.299405336380005,
"max": 3.295668363571167,
"count": 332
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 47121.25,
"min": 15642.83203125,
"max": 114542.3359375,
"count": 332
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 50.76288659793814,
"min": 42.76521739130435,
"max": 999.0,
"count": 332
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19696.0,
"min": 15884.0,
"max": 27488.0,
"count": 332
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1478.026642524961,
"min": 1179.7788040428786,
"max": 1478.026642524961,
"count": 325
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 286737.16864984244,
"min": 2364.1918829443184,
"max": 321863.026105703,
"count": 325
},
"SoccerTwos.Step.mean": {
"value": 3319968.0,
"min": 9760.0,
"max": 3319968.0,
"count": 332
},
"SoccerTwos.Step.sum": {
"value": 3319968.0,
"min": 9760.0,
"max": 3319968.0,
"count": 332
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.13224956393241882,
"min": -0.07247133553028107,
"max": 0.17099936306476593,
"count": 332
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 25.656415939331055,
"min": -13.824865341186523,
"max": 29.924888610839844,
"count": 332
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.13362355530261993,
"min": -0.06882161647081375,
"max": 0.17515622079372406,
"count": 332
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 25.922969818115234,
"min": -13.692461013793945,
"max": 30.6523380279541,
"count": 332
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 332
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 332
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.08665361109468125,
"min": -0.6923076923076923,
"max": 0.5811499978105227,
"count": 332
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 16.810800552368164,
"min": -45.21120023727417,
"max": 59.629999458789825,
"count": 332
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.08665361109468125,
"min": -0.6923076923076923,
"max": 0.5811499978105227,
"count": 332
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 16.810800552368164,
"min": -45.21120023727417,
"max": 59.629999458789825,
"count": 332
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 332
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 332
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01647280962206423,
"min": 0.010384321962677252,
"max": 0.025824726539819192,
"count": 157
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01647280962206423,
"min": 0.010384321962677252,
"max": 0.025824726539819192,
"count": 157
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.10077739705642065,
"min": 0.0006277227638444553,
"max": 0.11096864019831022,
"count": 157
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.10077739705642065,
"min": 0.0006277227638444553,
"max": 0.11096864019831022,
"count": 157
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10252556800842286,
"min": 0.0006187290273373947,
"max": 0.11352627476056416,
"count": 157
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10252556800842286,
"min": 0.0006187290273373947,
"max": 0.11352627476056416,
"count": 157
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 157
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 157
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 157
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 157
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 157
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 157
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1724983919",
"python_version": "3.10.12 (main, Jul 5 2023, 15:34:07) [Clang 14.0.6 ]",
"command_line_arguments": "/Users/caio.campos/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.2.2",
"numpy_version": "1.23.5",
"end_time_seconds": "1725010048"
},
"total": 26128.401052199,
"count": 1,
"self": 0.33014127099886537,
"children": {
"run_training.setup": {
"total": 0.038303445999190444,
"count": 1,
"self": 0.038303445999190444
},
"TrainerController.start_learning": {
"total": 26128.032607482,
"count": 1,
"self": 4.815222942630498,
"children": {
"TrainerController._reset_env": {
"total": 8.892866306008727,
"count": 17,
"self": 8.892866306008727
},
"TrainerController.advance": {
"total": 26114.05709432836,
"count": 220564,
"self": 4.818681626267789,
"children": {
"env_step": {
"total": 20777.331596008145,
"count": 220564,
"self": 20038.60178467525,
"children": {
"SubprocessEnvManager._take_step": {
"total": 735.6629285974359,
"count": 220564,
"self": 28.332394672645023,
"children": {
"TorchPolicy.evaluate": {
"total": 707.3305339247909,
"count": 423602,
"self": 707.3305339247909
}
}
},
"workers": {
"total": 3.06688273546024,
"count": 220563,
"self": 0.0,
"children": {
"worker_root": {
"total": 26112.673646069434,
"count": 220563,
"is_parallel": true,
"self": 6650.5135924498245,
"children": {
"steps_from_proto": {
"total": 0.05718903701563249,
"count": 34,
"is_parallel": true,
"self": 0.008453278995148139,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.048735758020484354,
"count": 136,
"is_parallel": true,
"self": 0.048735758020484354
}
}
},
"UnityEnvironment.step": {
"total": 19462.102864582594,
"count": 220563,
"is_parallel": true,
"self": 59.292598800391715,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 371.8948498334321,
"count": 220563,
"is_parallel": true,
"self": 371.8948498334321
},
"communicator.exchange": {
"total": 18326.88937894188,
"count": 220563,
"is_parallel": true,
"self": 18326.88937894188
},
"steps_from_proto": {
"total": 704.02603700689,
"count": 441126,
"is_parallel": true,
"self": 94.92409573729674,
"children": {
"_process_rank_one_or_two_observation": {
"total": 609.1019412695932,
"count": 1764504,
"is_parallel": true,
"self": 609.1019412695932
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 5331.906816693945,
"count": 220563,
"self": 39.04413141792611,
"children": {
"process_trajectory": {
"total": 676.097296054013,
"count": 220563,
"self": 674.3273022760113,
"children": {
"RLTrainer._checkpoint": {
"total": 1.7699937780016626,
"count": 6,
"self": 1.7699937780016626
}
}
},
"_update_policy": {
"total": 4616.765389222006,
"count": 158,
"self": 473.07072151311513,
"children": {
"TorchPOCAOptimizer.update": {
"total": 4143.694667708891,
"count": 4740,
"self": 4143.694667708891
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.1279989848844707e-06,
"count": 1,
"self": 1.1279989848844707e-06
},
"TrainerController._save_models": {
"total": 0.2674227770039579,
"count": 1,
"self": 0.0017639980069361627,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2656587789970217,
"count": 1,
"self": 0.2656587789970217
}
}
}
}
}
}
}