{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 3.0953874588012695,
"min": 3.0953874588012695,
"max": 3.2946317195892334,
"count": 78
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 17928.484375,
"min": 3954.2001953125,
"max": 105428.21875,
"count": 78
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 966.5,
"min": 219.88888888888889,
"max": 999.0,
"count": 78
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 7732.0,
"min": 2536.0,
"max": 24632.0,
"count": 78
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1202.5900716306517,
"min": 1199.9202472092547,
"max": 1206.5010921371231,
"count": 54
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 2405.1801432613033,
"min": 2403.498433353844,
"max": 12057.767178482298,
"count": 54
},
"SoccerTwos.Step.mean": {
"value": 399123.0,
"min": 4332.0,
"max": 399123.0,
"count": 80
},
"SoccerTwos.Step.sum": {
"value": 399123.0,
"min": 4332.0,
"max": 399123.0,
"count": 80
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.0028270359616726637,
"min": -0.015790298581123352,
"max": 0.009247126057744026,
"count": 80
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.014135180041193962,
"min": -0.12632238864898682,
"max": 0.04623563215136528,
"count": 80
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.0028270361945033073,
"min": -0.015790289267897606,
"max": 0.009247127920389175,
"count": 80
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.014135180972516537,
"min": -0.12632231414318085,
"max": 0.04623563960194588,
"count": 80
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 80
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 80
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.012919999659061432,
"min": -0.5,
"max": 0.5408363721587441,
"count": 80
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 0.06459999829530716,
"min": -5.0848000049591064,
"max": 5.949200093746185,
"count": 80
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.012919999659061432,
"min": -0.5,
"max": 0.5408363721587441,
"count": 80
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 0.06459999829530716,
"min": -5.0848000049591064,
"max": 5.949200093746185,
"count": 80
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.03599075341597199,
"min": 0.02652264821117569,
"max": 0.03958484005124774,
"count": 78
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.03599075341597199,
"min": 0.02737326630934452,
"max": 0.1006289279997353,
"count": 78
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.002975616512121633,
"min": 4.912644244387317e-12,
"max": 0.0040068723130389115,
"count": 78
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.002975616512121633,
"min": 9.825288488774635e-12,
"max": 0.008013744626077823,
"count": 78
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.0029756165039725602,
"min": 4.912676342611613e-12,
"max": 0.004006872307218146,
"count": 78
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.0029756165039725602,
"min": 9.825352685223225e-12,
"max": 0.008013744614436292,
"count": 78
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.00030000000000000014,
"count": 78
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0009,
"count": 78
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.09999999999999998,
"min": 0.09999999999999996,
"max": 0.1,
"count": 78
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.09999999999999998,
"min": 0.09999999999999996,
"max": 0.29999999999999993,
"count": 78
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.0004000000000000001,
"min": 0.00039999999999999996,
"max": 0.0004000000000000002,
"count": 78
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.0004000000000000001,
"min": 0.00039999999999999996,
"max": 0.0012000000000000001,
"count": 78
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 80
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 80
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1699128120",
"python_version": "3.10.12 | packaged by Anaconda, Inc. | (main, Jul 5 2023, 19:01:18) [MSC v.1916 64 bit (AMD64)]",
"command_line_arguments": "\\\\?\\C:\\Users\\darkd\\miniconda3\\envs\\rl\\Scripts\\mlagents-learn .\\config\\poca\\behaviors.yml --env=.\\training-envs-executable\\SoccerTwos\\SoccerTwos.exe --run-id=xovernightx --no-graphics --force",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.0.0+cpu",
"numpy_version": "1.23.5",
"end_time_seconds": "1699130648"
},
"total": 2527.6832791999987,
"count": 1,
"self": 0.33226709999871673,
"children": {
"run_training.setup": {
"total": 0.14834870000049705,
"count": 1,
"self": 0.14834870000049705
},
"TrainerController.start_learning": {
"total": 2527.2026633999994,
"count": 1,
"self": 1.2376500002355897,
"children": {
"TrainerController._reset_env": {
"total": 6.365150799974799,
"count": 19,
"self": 6.365150799974799
},
"TrainerController.advance": {
"total": 2519.307256399792,
"count": 33101,
"self": 1.1794261996183195,
"children": {
"env_step": {
"total": 934.8396340999607,
"count": 33101,
"self": 708.1390166005003,
"children": {
"SubprocessEnvManager._take_step": {
"total": 225.90577660004783,
"count": 33101,
"self": 7.087370800196368,
"children": {
"TorchPolicy.evaluate": {
"total": 218.81840579985146,
"count": 65732,
"self": 218.81840579985146
}
}
},
"workers": {
"total": 0.7948408994125202,
"count": 33101,
"self": 0.0,
"children": {
"worker_root": {
"total": 2520.518991699988,
"count": 33101,
"is_parallel": true,
"self": 1967.1660637001332,
"children": {
"steps_from_proto": {
"total": 0.04562999999325257,
"count": 38,
"is_parallel": true,
"self": 0.010100100022100378,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.03552989997115219,
"count": 152,
"is_parallel": true,
"self": 0.03552989997115219
}
}
},
"UnityEnvironment.step": {
"total": 553.3072979998615,
"count": 33101,
"is_parallel": true,
"self": 27.095727399908355,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 25.477302699480788,
"count": 33101,
"is_parallel": true,
"self": 25.477302699480788
},
"communicator.exchange": {
"total": 406.09700419979345,
"count": 33101,
"is_parallel": true,
"self": 406.09700419979345
},
"steps_from_proto": {
"total": 94.63726370067889,
"count": 66202,
"is_parallel": true,
"self": 20.000750102903112,
"children": {
"_process_rank_one_or_two_observation": {
"total": 74.63651359777577,
"count": 264808,
"is_parallel": true,
"self": 74.63651359777577
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1583.288196100213,
"count": 33101,
"self": 7.677287199570856,
"children": {
"process_trajectory": {
"total": 88.717625300691,
"count": 33101,
"self": 88.717625300691
},
"_update_policy": {
"total": 1486.8932835999512,
"count": 122,
"self": 292.86508180006786,
"children": {
"TorchPOCAOptimizer.update": {
"total": 1194.0282017998834,
"count": 7060,
"self": 1194.0282017998834
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.4999968698248267e-06,
"count": 1,
"self": 1.4999968698248267e-06
},
"TrainerController._save_models": {
"total": 0.29260470000008354,
"count": 1,
"self": 0.010557099994912278,
"children": {
"RLTrainer._checkpoint": {
"total": 0.28204760000517126,
"count": 1,
"self": 0.28204760000517126
}
}
}
}
}
}
}