First Push`

775fd9e over 2 years ago

15.7 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.9924488067626953,
	"min": 2.958897590637207,
	"max": 3.1828112602233887,
	"count": 300
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 77660.03125,
	"min": 21516.66015625,
	"max": 137188.0625,
	"count": 300
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 475.54545454545456,
	"min": 334.06666666666666,
	"max": 999.0,
	"count": 300
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 20924.0,
	"min": 4976.0,
	"max": 30936.0,
	"count": 300
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1241.8774269485682,
	"min": 1192.8382636217825,
	"max": 1247.5560014737573,
	"count": 282
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 22353.793685074226,
	"min": 2387.111447047758,
	"max": 34624.33795049888,
	"count": 282
	},
	"SoccerTwos.Step.mean": {
	"value": 2999666.0,
	"min": 9484.0,
	"max": 2999666.0,
	"count": 300
	},
	"SoccerTwos.Step.sum": {
	"value": 2999666.0,
	"min": 9484.0,
	"max": 2999666.0,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.016900047659873962,
	"min": -0.019958587363362312,
	"max": -0.001513068564236164,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.3549010157585144,
	"min": -0.3693455159664154,
	"max": -0.01775738224387169,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.01757766678929329,
	"min": -0.019750839099287987,
	"max": -0.0010202398989349604,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.3691309988498688,
	"min": -0.3691309988498688,
	"max": -0.012242878787219524,
	"count": 300
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 300
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.11979047457377116,
	"min": -0.682741176117869,
	"max": 0.338373335202535,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -2.5155999660491943,
	"min": -13.14359998703003,
	"max": 5.208000034093857,
	"count": 300
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.11979047457377116,
	"min": -0.682741176117869,
	"max": 0.338373335202535,
	"count": 300
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -2.5155999660491943,
	"min": -13.14359998703003,
	"max": 5.208000034093857,
	"count": 300
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 300
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 300
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.008282075870859747,
	"min": 0.005789831588238788,
	"max": 0.010839468071208103,
	"count": 36
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.008282075870859747,
	"min": 0.005789831588238788,
	"max": 0.010839468071208103,
	"count": 36
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.006328290343905489,
	"min": 0.001657259821270903,
	"max": 0.009326495820035537,
	"count": 36
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.006328290343905489,
	"min": 0.001657259821270903,
	"max": 0.009326495820035537,
	"count": 36
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.006342333027472099,
	"min": 0.0016584567182386914,
	"max": 0.009329031966626645,
	"count": 36
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.006342333027472099,
	"min": 0.0016584567182386914,
	"max": 0.009329031966626645,
	"count": 36
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 7.372099385666599e-06,
	"min": 7.372099385666599e-06,
	"max": 0.0011668776027601998,
	"count": 36
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 7.372099385666599e-06,
	"min": 7.372099385666599e-06,
	"max": 0.0011668776027601998,
	"count": 36
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.10061433333333329,
	"min": 0.10061433333333329,
	"max": 0.19723980000000008,
	"count": 36
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.10061433333333329,
	"min": 0.10061433333333329,
	"max": 0.19723980000000008,
	"count": 36
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 4.065523333333305e-05,
	"min": 4.065523333333305e-05,
	"max": 0.004862266020000001,
	"count": 36
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 4.065523333333305e-05,
	"min": 4.065523333333305e-05,
	"max": 0.004862266020000001,
	"count": 36
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1677574592",
	"python_version": "3.9.16 (main, Jan 11 2023, 16:16:36) [MSC v.1916 64 bit (AMD64)]",
	"command_line_arguments": "C:\\Users\\gmojkowski\\.conda\\envs\\rl\\Scripts\\mlagents-learn ml-agents/config/poca/SoccerTwos.yaml --env SoccerTwos/SoccerTwos.exe --run-id=resnet_base_v4 --no-graphics --initialize-from=resnet_base_v3",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.13.1+cpu",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1677618311"
	},
	"total": 43718.9919943,
	"count": 1,
	"self": 0.4404387999966275,
	"children": {
	"run_training.setup": {
	"total": 0.22507939999999982,
	"count": 1,
	"self": 0.22507939999999982
	},
	"TrainerController.start_learning": {
	"total": 43718.3264761,
	"count": 1,
	"self": 6.2553304009270505,
	"children": {
	"TrainerController._reset_env": {
	"total": 7.25175750001204,
	"count": 15,
	"self": 7.25175750001204
	},
	"TrainerController.advance": {
	"total": 43704.68255109906,
	"count": 195046,
	"self": 6.6376943998620845,
	"children": {
	"env_step": {
	"total": 27823.66736159923,
	"count": 195046,
	"self": 26713.80841279826,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1105.5911817002898,
	"count": 195046,
	"self": 37.86665240134971,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1067.72452929894,
	"count": 386592,
	"self": 1067.72452929894
	}
	}
	},
	"workers": {
	"total": 4.2677671006802465,
	"count": 195046,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 43703.49372489968,
	"count": 195046,
	"is_parallel": true,
	"self": 17770.0365155002,
	"children": {
	"steps_from_proto": {
	"total": 0.05832419999175542,
	"count": 30,
	"is_parallel": true,
	"self": 0.006691800038452378,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.05163239995330304,
	"count": 120,
	"is_parallel": true,
	"self": 0.05163239995330304
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 25933.398885199487,
	"count": 195046,
	"is_parallel": true,
	"self": 56.72683119988142,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 521.6316486982222,
	"count": 195046,
	"is_parallel": true,
	"self": 521.6316486982222
	},
	"communicator.exchange": {
	"total": 24396.046228599782,
	"count": 195046,
	"is_parallel": true,
	"self": 24396.046228599782
	},
	"steps_from_proto": {
	"total": 958.9941767016019,
	"count": 390092,
	"is_parallel": true,
	"self": 111.15929309924877,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 847.8348836023531,
	"count": 1560368,
	"is_parallel": true,
	"self": 847.8348836023531
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 15874.377495099965,
	"count": 195046,
	"self": 46.30661719941418,
	"children": {
	"process_trajectory": {
	"total": 8990.299759200574,
	"count": 195046,
	"self": 8988.298889900569,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.0008693000054336,
	"count": 10,
	"self": 2.0008693000054336
	}
	}
	},
	"_update_policy": {
	"total": 6837.771118699977,
	"count": 36,
	"self": 692.7114432000171,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 6145.05967549996,
	"count": 1080,
	"self": 6145.05967549996
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.999995770864189e-07,
	"count": 1,
	"self": 8.999995770864189e-07
	},
	"TrainerController._save_models": {
	"total": 0.13683620000665542,
	"count": 1,
	"self": 0.0033173000119859353,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.13351889999466948,
	"count": 1,
	"self": 0.13351889999466948
	}
	}
	}
	}
	}
	}
	}