akghxhs55's picture
First Push
ce5aafd
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 0.5079799890518188,
"min": 0.5056769251823425,
"max": 0.7852402925491333,
"count": 621
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 51269.40234375,
"min": 326.65997314453125,
"max": 78123.0546875,
"count": 621
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 68.54293628808864,
"min": 9.0,
"max": 80.0551948051948,
"count": 621
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 98976.0,
"min": 72.0,
"max": 100416.0,
"count": 621
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1170.8534892772898,
"min": 1150.3353937746865,
"max": 1250.6523380178,
"count": 621
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 845356.2192582032,
"min": 4804.985629723263,
"max": 1037939.4706775222,
"count": 621
},
"SoccerTwos.Step.mean": {
"value": 99999939.0,
"min": 68999989.0,
"max": 99999939.0,
"count": 621
},
"SoccerTwos.Step.sum": {
"value": 99999939.0,
"min": 68999989.0,
"max": 99999939.0,
"count": 621
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.0405665747821331,
"min": -0.08486969023942947,
"max": 0.1448543667793274,
"count": 621
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -29.24850082397461,
"min": -65.43453216552734,
"max": 16.586124420166016,
"count": 621
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.040638986974954605,
"min": -0.0855465903878212,
"max": 0.14996777474880219,
"count": 621
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -29.300710678100586,
"min": -65.9564208984375,
"max": 16.9932861328125,
"count": 621
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 621
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 621
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.05486158003588821,
"min": -0.19329876561223724,
"max": 0.9908000230789185,
"count": 621
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -39.5551992058754,
"min": -156.57200014591217,
"max": 101.72799974679947,
"count": 621
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.05486158003588821,
"min": -0.19329876561223724,
"max": 0.9908000230789185,
"count": 621
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -39.5551992058754,
"min": -156.57200014591217,
"max": 101.72799974679947,
"count": 621
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 621
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 621
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.011562750603237268,
"min": 0.006540073479603355,
"max": 0.017336187163891736,
"count": 620
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.011562750603237268,
"min": 0.006540073479603355,
"max": 0.030448245476388063,
"count": 620
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.0984947495162487,
"min": 0.0835721002270778,
"max": 0.11199088642994563,
"count": 620
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.0984947495162487,
"min": 0.0835721002270778,
"max": 0.2153649392227332,
"count": 620
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.09880854934453964,
"min": 0.08427299776424964,
"max": 0.1126904608681798,
"count": 620
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.09880854934453964,
"min": 0.08427299776424964,
"max": 0.21592610919227204,
"count": 620
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 4.891898372699995e-08,
"min": 4.891898372699995e-08,
"max": 9.290173803277699e-05,
"count": 620
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 4.891898372699995e-08,
"min": 4.891898372699995e-08,
"max": 0.00018550815616399398,
"count": 620
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.100016273,
"min": 0.100016273,
"max": 0.13096722300000002,
"count": 620
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.100016273,
"min": 0.100016273,
"max": 0.261836006,
"count": 620
},
"SoccerTwos.Policy.Beta.mean": {
"value": 1.08120227e-05,
"min": 1.08120227e-05,
"max": 0.0015552644277000002,
"count": 620
},
"SoccerTwos.Policy.Beta.sum": {
"value": 1.08120227e-05,
"min": 1.08120227e-05,
"max": 0.0031056166994,
"count": 620
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1677714024",
"python_version": "3.9.5 (default, Nov 23 2021, 15:27:38) \n[GCC 9.3.0]",
"command_line_arguments": "/home/akghxhs55/.local/share/virtualenvs/unit7-nHLSdMlF/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=/home/akghxhs55/study/hugging-face/deep-rl/unit7/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos-11 --no-graphics --resume",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu115",
"numpy_version": "1.21.2",
"end_time_seconds": "1677752204"
},
"total": 38179.97978298599,
"count": 1,
"self": 0.8270952310413122,
"children": {
"run_training.setup": {
"total": 0.009300585952587426,
"count": 1,
"self": 0.009300585952587426
},
"TrainerController.start_learning": {
"total": 38179.143387168995,
"count": 1,
"self": 27.044664017041214,
"children": {
"TrainerController._reset_env": {
"total": 3.966062439722009,
"count": 79,
"self": 3.966062439722009
},
"TrainerController.advance": {
"total": 38147.78208047617,
"count": 2121550,
"self": 27.518943287897855,
"children": {
"env_step": {
"total": 30023.026193613303,
"count": 2121550,
"self": 20003.88848861691,
"children": {
"SubprocessEnvManager._take_step": {
"total": 10000.533994897502,
"count": 2121550,
"self": 172.42056694882922,
"children": {
"TorchPolicy.evaluate": {
"total": 9828.113427948672,
"count": 3883314,
"self": 9828.113427948672
}
}
},
"workers": {
"total": 18.603710098890588,
"count": 2121550,
"self": 0.0,
"children": {
"worker_root": {
"total": 38105.96762576746,
"count": 2121550,
"is_parallel": true,
"self": 20734.46843218454,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0016472090501338243,
"count": 2,
"is_parallel": true,
"self": 0.0004687310429289937,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011784780072048306,
"count": 8,
"is_parallel": true,
"self": 0.0011784780072048306
}
}
},
"UnityEnvironment.step": {
"total": 0.01564809901174158,
"count": 1,
"is_parallel": true,
"self": 0.000300175161100924,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00022016989532858133,
"count": 1,
"is_parallel": true,
"self": 0.00022016989532858133
},
"communicator.exchange": {
"total": 0.014317468972876668,
"count": 1,
"is_parallel": true,
"self": 0.014317468972876668
},
"steps_from_proto": {
"total": 0.0008102849824354053,
"count": 2,
"is_parallel": true,
"self": 0.00017089187167584896,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0006393931107595563,
"count": 8,
"is_parallel": true,
"self": 0.0006393931107595563
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.06000017421320081,
"count": 156,
"is_parallel": true,
"self": 0.011994376429356635,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.04800579778384417,
"count": 624,
"is_parallel": true,
"self": 0.04800579778384417
}
}
},
"UnityEnvironment.step": {
"total": 17371.439193408703,
"count": 2121549,
"is_parallel": true,
"self": 568.4360090695554,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 326.56921866338234,
"count": 2121549,
"is_parallel": true,
"self": 326.56921866338234
},
"communicator.exchange": {
"total": 14999.379022408393,
"count": 2121549,
"is_parallel": true,
"self": 14999.379022408393
},
"steps_from_proto": {
"total": 1477.0549432673724,
"count": 4243098,
"is_parallel": true,
"self": 292.3377271288773,
"children": {
"_process_rank_one_or_two_observation": {
"total": 1184.7172161384951,
"count": 16972392,
"is_parallel": true,
"self": 1184.7172161384951
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 8097.2369435749715,
"count": 2121550,
"self": 193.23693259479478,
"children": {
"process_trajectory": {
"total": 3961.4725717210677,
"count": 2121550,
"self": 3939.7263424687553,
"children": {
"RLTrainer._checkpoint": {
"total": 21.746229252312332,
"count": 63,
"self": 21.746229252312332
}
}
},
"_update_policy": {
"total": 3942.527439259109,
"count": 942,
"self": 2009.3178590056486,
"children": {
"TorchPOCAOptimizer.update": {
"total": 1933.2095802534604,
"count": 22608,
"self": 1933.2095802534604
}
}
}
}
}
}
},
"trainer_threads": {
"total": 4.930188879370689e-07,
"count": 1,
"self": 4.930188879370689e-07
},
"TrainerController._save_models": {
"total": 0.3505797430407256,
"count": 1,
"self": 0.004716911003924906,
"children": {
"RLTrainer._checkpoint": {
"total": 0.3458628320368007,
"count": 1,
"self": 0.3458628320368007
}
}
}
}
}
}
}