poca-SoccerTwos-7 / run_logs /timers.json

First Push

ce5aafd about 2 years ago

20.3 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 0.5079799890518188,
	"min": 0.5056769251823425,
	"max": 0.7852402925491333,
	"count": 621
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 51269.40234375,
	"min": 326.65997314453125,
	"max": 78123.0546875,
	"count": 621
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 68.54293628808864,
	"min": 9.0,
	"max": 80.0551948051948,
	"count": 621
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 98976.0,
	"min": 72.0,
	"max": 100416.0,
	"count": 621
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1170.8534892772898,
	"min": 1150.3353937746865,
	"max": 1250.6523380178,
	"count": 621
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 845356.2192582032,
	"min": 4804.985629723263,
	"max": 1037939.4706775222,
	"count": 621
	},
	"SoccerTwos.Step.mean": {
	"value": 99999939.0,
	"min": 68999989.0,
	"max": 99999939.0,
	"count": 621
	},
	"SoccerTwos.Step.sum": {
	"value": 99999939.0,
	"min": 68999989.0,
	"max": 99999939.0,
	"count": 621
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.0405665747821331,
	"min": -0.08486969023942947,
	"max": 0.1448543667793274,
	"count": 621
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -29.24850082397461,
	"min": -65.43453216552734,
	"max": 16.586124420166016,
	"count": 621
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.040638986974954605,
	"min": -0.0855465903878212,
	"max": 0.14996777474880219,
	"count": 621
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -29.300710678100586,
	"min": -65.9564208984375,
	"max": 16.9932861328125,
	"count": 621
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 621
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 621
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.05486158003588821,
	"min": -0.19329876561223724,
	"max": 0.9908000230789185,
	"count": 621
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -39.5551992058754,
	"min": -156.57200014591217,
	"max": 101.72799974679947,
	"count": 621
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.05486158003588821,
	"min": -0.19329876561223724,
	"max": 0.9908000230789185,
	"count": 621
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -39.5551992058754,
	"min": -156.57200014591217,
	"max": 101.72799974679947,
	"count": 621
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 621
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 621
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.011562750603237268,
	"min": 0.006540073479603355,
	"max": 0.017336187163891736,
	"count": 620
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.011562750603237268,
	"min": 0.006540073479603355,
	"max": 0.030448245476388063,
	"count": 620
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.0984947495162487,
	"min": 0.0835721002270778,
	"max": 0.11199088642994563,
	"count": 620
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.0984947495162487,
	"min": 0.0835721002270778,
	"max": 0.2153649392227332,
	"count": 620
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.09880854934453964,
	"min": 0.08427299776424964,
	"max": 0.1126904608681798,
	"count": 620
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.09880854934453964,
	"min": 0.08427299776424964,
	"max": 0.21592610919227204,
	"count": 620
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 4.891898372699995e-08,
	"min": 4.891898372699995e-08,
	"max": 9.290173803277699e-05,
	"count": 620
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 4.891898372699995e-08,
	"min": 4.891898372699995e-08,
	"max": 0.00018550815616399398,
	"count": 620
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.100016273,
	"min": 0.100016273,
	"max": 0.13096722300000002,
	"count": 620
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.100016273,
	"min": 0.100016273,
	"max": 0.261836006,
	"count": 620
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 1.08120227e-05,
	"min": 1.08120227e-05,
	"max": 0.0015552644277000002,
	"count": 620
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 1.08120227e-05,
	"min": 1.08120227e-05,
	"max": 0.0031056166994,
	"count": 620
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1677714024",
	"python_version": "3.9.5 (default, Nov 23 2021, 15:27:38) \n[GCC 9.3.0]",
	"command_line_arguments": "/home/akghxhs55/.local/share/virtualenvs/unit7-nHLSdMlF/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=/home/akghxhs55/study/hugging-face/deep-rl/unit7/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos-11 --no-graphics --resume",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu115",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1677752204"
	},
	"total": 38179.97978298599,
	"count": 1,
	"self": 0.8270952310413122,
	"children": {
	"run_training.setup": {
	"total": 0.009300585952587426,
	"count": 1,
	"self": 0.009300585952587426
	},
	"TrainerController.start_learning": {
	"total": 38179.143387168995,
	"count": 1,
	"self": 27.044664017041214,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.966062439722009,
	"count": 79,
	"self": 3.966062439722009
	},
	"TrainerController.advance": {
	"total": 38147.78208047617,
	"count": 2121550,
	"self": 27.518943287897855,
	"children": {
	"env_step": {
	"total": 30023.026193613303,
	"count": 2121550,
	"self": 20003.88848861691,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 10000.533994897502,
	"count": 2121550,
	"self": 172.42056694882922,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 9828.113427948672,
	"count": 3883314,
	"self": 9828.113427948672
	}
	}
	},
	"workers": {
	"total": 18.603710098890588,
	"count": 2121550,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 38105.96762576746,
	"count": 2121550,
	"is_parallel": true,
	"self": 20734.46843218454,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0016472090501338243,
	"count": 2,
	"is_parallel": true,
	"self": 0.0004687310429289937,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0011784780072048306,
	"count": 8,
	"is_parallel": true,
	"self": 0.0011784780072048306
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.01564809901174158,
	"count": 1,
	"is_parallel": true,
	"self": 0.000300175161100924,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00022016989532858133,
	"count": 1,
	"is_parallel": true,
	"self": 0.00022016989532858133
	},
	"communicator.exchange": {
	"total": 0.014317468972876668,
	"count": 1,
	"is_parallel": true,
	"self": 0.014317468972876668
	},
	"steps_from_proto": {
	"total": 0.0008102849824354053,
	"count": 2,
	"is_parallel": true,
	"self": 0.00017089187167584896,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0006393931107595563,
	"count": 8,
	"is_parallel": true,
	"self": 0.0006393931107595563
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.06000017421320081,
	"count": 156,
	"is_parallel": true,
	"self": 0.011994376429356635,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.04800579778384417,
	"count": 624,
	"is_parallel": true,
	"self": 0.04800579778384417
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 17371.439193408703,
	"count": 2121549,
	"is_parallel": true,
	"self": 568.4360090695554,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 326.56921866338234,
	"count": 2121549,
	"is_parallel": true,
	"self": 326.56921866338234
	},
	"communicator.exchange": {
	"total": 14999.379022408393,
	"count": 2121549,
	"is_parallel": true,
	"self": 14999.379022408393
	},
	"steps_from_proto": {
	"total": 1477.0549432673724,
	"count": 4243098,
	"is_parallel": true,
	"self": 292.3377271288773,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 1184.7172161384951,
	"count": 16972392,
	"is_parallel": true,
	"self": 1184.7172161384951
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 8097.2369435749715,
	"count": 2121550,
	"self": 193.23693259479478,
	"children": {
	"process_trajectory": {
	"total": 3961.4725717210677,
	"count": 2121550,
	"self": 3939.7263424687553,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 21.746229252312332,
	"count": 63,
	"self": 21.746229252312332
	}
	}
	},
	"_update_policy": {
	"total": 3942.527439259109,
	"count": 942,
	"self": 2009.3178590056486,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 1933.2095802534604,
	"count": 22608,
	"self": 1933.2095802534604
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 4.930188879370689e-07,
	"count": 1,
	"self": 4.930188879370689e-07
	},
	"TrainerController._save_models": {
	"total": 0.3505797430407256,
	"count": 1,
	"self": 0.004716911003924906,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.3458628320368007,
	"count": 1,
	"self": 0.3458628320368007
	}
	}
	}
	}
	}
	}
	}