|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 0.5079799890518188, |
|
"min": 0.5056769251823425, |
|
"max": 0.7852402925491333, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 51269.40234375, |
|
"min": 326.65997314453125, |
|
"max": 78123.0546875, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 68.54293628808864, |
|
"min": 9.0, |
|
"max": 80.0551948051948, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 98976.0, |
|
"min": 72.0, |
|
"max": 100416.0, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1170.8534892772898, |
|
"min": 1150.3353937746865, |
|
"max": 1250.6523380178, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 845356.2192582032, |
|
"min": 4804.985629723263, |
|
"max": 1037939.4706775222, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 99999939.0, |
|
"min": 68999989.0, |
|
"max": 99999939.0, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 99999939.0, |
|
"min": 68999989.0, |
|
"max": 99999939.0, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.0405665747821331, |
|
"min": -0.08486969023942947, |
|
"max": 0.1448543667793274, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -29.24850082397461, |
|
"min": -65.43453216552734, |
|
"max": 16.586124420166016, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.040638986974954605, |
|
"min": -0.0855465903878212, |
|
"max": 0.14996777474880219, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -29.300710678100586, |
|
"min": -65.9564208984375, |
|
"max": 16.9932861328125, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.05486158003588821, |
|
"min": -0.19329876561223724, |
|
"max": 0.9908000230789185, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -39.5551992058754, |
|
"min": -156.57200014591217, |
|
"max": 101.72799974679947, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.05486158003588821, |
|
"min": -0.19329876561223724, |
|
"max": 0.9908000230789185, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -39.5551992058754, |
|
"min": -156.57200014591217, |
|
"max": 101.72799974679947, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 621 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.011562750603237268, |
|
"min": 0.006540073479603355, |
|
"max": 0.017336187163891736, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.011562750603237268, |
|
"min": 0.006540073479603355, |
|
"max": 0.030448245476388063, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.0984947495162487, |
|
"min": 0.0835721002270778, |
|
"max": 0.11199088642994563, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.0984947495162487, |
|
"min": 0.0835721002270778, |
|
"max": 0.2153649392227332, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.09880854934453964, |
|
"min": 0.08427299776424964, |
|
"max": 0.1126904608681798, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.09880854934453964, |
|
"min": 0.08427299776424964, |
|
"max": 0.21592610919227204, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 4.891898372699995e-08, |
|
"min": 4.891898372699995e-08, |
|
"max": 9.290173803277699e-05, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 4.891898372699995e-08, |
|
"min": 4.891898372699995e-08, |
|
"max": 0.00018550815616399398, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.100016273, |
|
"min": 0.100016273, |
|
"max": 0.13096722300000002, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.100016273, |
|
"min": 0.100016273, |
|
"max": 0.261836006, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 1.08120227e-05, |
|
"min": 1.08120227e-05, |
|
"max": 0.0015552644277000002, |
|
"count": 620 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 1.08120227e-05, |
|
"min": 1.08120227e-05, |
|
"max": 0.0031056166994, |
|
"count": 620 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1677714024", |
|
"python_version": "3.9.5 (default, Nov 23 2021, 15:27:38) \n[GCC 9.3.0]", |
|
"command_line_arguments": "/home/akghxhs55/.local/share/virtualenvs/unit7-nHLSdMlF/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=/home/akghxhs55/study/hugging-face/deep-rl/unit7/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos-11 --no-graphics --resume", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu115", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1677752204" |
|
}, |
|
"total": 38179.97978298599, |
|
"count": 1, |
|
"self": 0.8270952310413122, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.009300585952587426, |
|
"count": 1, |
|
"self": 0.009300585952587426 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 38179.143387168995, |
|
"count": 1, |
|
"self": 27.044664017041214, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 3.966062439722009, |
|
"count": 79, |
|
"self": 3.966062439722009 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 38147.78208047617, |
|
"count": 2121550, |
|
"self": 27.518943287897855, |
|
"children": { |
|
"env_step": { |
|
"total": 30023.026193613303, |
|
"count": 2121550, |
|
"self": 20003.88848861691, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 10000.533994897502, |
|
"count": 2121550, |
|
"self": 172.42056694882922, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 9828.113427948672, |
|
"count": 3883314, |
|
"self": 9828.113427948672 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 18.603710098890588, |
|
"count": 2121550, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 38105.96762576746, |
|
"count": 2121550, |
|
"is_parallel": true, |
|
"self": 20734.46843218454, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0016472090501338243, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0004687310429289937, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011784780072048306, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011784780072048306 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.01564809901174158, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000300175161100924, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00022016989532858133, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00022016989532858133 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.014317468972876668, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.014317468972876668 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0008102849824354053, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.00017089187167584896, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0006393931107595563, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0006393931107595563 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.06000017421320081, |
|
"count": 156, |
|
"is_parallel": true, |
|
"self": 0.011994376429356635, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.04800579778384417, |
|
"count": 624, |
|
"is_parallel": true, |
|
"self": 0.04800579778384417 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 17371.439193408703, |
|
"count": 2121549, |
|
"is_parallel": true, |
|
"self": 568.4360090695554, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 326.56921866338234, |
|
"count": 2121549, |
|
"is_parallel": true, |
|
"self": 326.56921866338234 |
|
}, |
|
"communicator.exchange": { |
|
"total": 14999.379022408393, |
|
"count": 2121549, |
|
"is_parallel": true, |
|
"self": 14999.379022408393 |
|
}, |
|
"steps_from_proto": { |
|
"total": 1477.0549432673724, |
|
"count": 4243098, |
|
"is_parallel": true, |
|
"self": 292.3377271288773, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 1184.7172161384951, |
|
"count": 16972392, |
|
"is_parallel": true, |
|
"self": 1184.7172161384951 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 8097.2369435749715, |
|
"count": 2121550, |
|
"self": 193.23693259479478, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 3961.4725717210677, |
|
"count": 2121550, |
|
"self": 3939.7263424687553, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 21.746229252312332, |
|
"count": 63, |
|
"self": 21.746229252312332 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 3942.527439259109, |
|
"count": 942, |
|
"self": 2009.3178590056486, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 1933.2095802534604, |
|
"count": 22608, |
|
"self": 1933.2095802534604 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 4.930188879370689e-07, |
|
"count": 1, |
|
"self": 4.930188879370689e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.3505797430407256, |
|
"count": 1, |
|
"self": 0.004716911003924906, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.3458628320368007, |
|
"count": 1, |
|
"self": 0.3458628320368007 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |