First Push

f7ffbcd almost 2 years ago

15.6 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.295811891555786,
	"min": 3.2958104610443115,
	"max": 3.2958128452301025,
	"count": 10
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 76251.90625,
	"min": 32061.64453125,
	"max": 105466.0078125,
	"count": 10
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 901.6666666666666,
	"min": 457.14285714285717,
	"max": 949.2,
	"count": 10
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 21640.0,
	"min": 12800.0,
	"max": 27424.0,
	"count": 10
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1199.3174515811288,
	"min": 1197.3801008004168,
	"max": 1200.0228273122877,
	"count": 10
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 2398.6349031622576,
	"min": 2396.1189814205263,
	"max": 12000.228273122877,
	"count": 10
	},
	"SoccerTwos.Step.mean": {
	"value": 99242.0,
	"min": 9728.0,
	"max": 99242.0,
	"count": 10
	},
	"SoccerTwos.Step.sum": {
	"value": 99242.0,
	"min": 9728.0,
	"max": 99242.0,
	"count": 10
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.0925903245806694,
	"min": -0.09259041398763657,
	"max": -0.09259025007486343,
	"count": 10
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -1.0184935331344604,
	"min": -1.4814465045928955,
	"max": -1.0184929370880127,
	"count": 10
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.09259033203125,
	"min": -0.0925903394818306,
	"max": -0.09259026497602463,
	"count": 10
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -1.01849365234375,
	"min": -1.4814449548721313,
	"max": -1.0184929370880127,
	"count": 10
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 10
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 10
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.18181818181818182,
	"min": -0.36363636363636365,
	"max": 0.2736923052714421,
	"count": 10
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -2.0,
	"min": -4.544000029563904,
	"max": 3.5579999685287476,
	"count": 10
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.18181818181818182,
	"min": -0.36363636363636365,
	"max": 0.2736923052714421,
	"count": 10
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -2.0,
	"min": -4.544000029563904,
	"max": 3.5579999685287476,
	"count": 10
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 10
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 10
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1677622138",
	"python_version": "3.9.16 (main, Jan 11 2023, 16:05:54) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/akriel/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu113",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1677622243"
	},
	"total": 105.266430096,
	"count": 1,
	"self": 0.3191557019999891,
	"children": {
	"run_training.setup": {
	"total": 0.007034048000008397,
	"count": 1,
	"self": 0.007034048000008397
	},
	"TrainerController.start_learning": {
	"total": 104.940240346,
	"count": 1,
	"self": 0.1252862329993718,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.857088169000008,
	"count": 1,
	"self": 4.857088169000008
	},
	"TrainerController.advance": {
	"total": 99.7949521520006,
	"count": 6766,
	"self": 0.1260310760013681,
	"children": {
	"env_step": {
	"total": 93.19740691099804,
	"count": 6766,
	"self": 68.33193762600021,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 24.78813652399853,
	"count": 6766,
	"self": 0.587359405997347,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 24.200777118001184,
	"count": 13462,
	"self": 24.200777118001184
	}
	}
	},
	"workers": {
	"total": 0.07733276099929753,
	"count": 6766,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 104.50876852200096,
	"count": 6766,
	"is_parallel": true,
	"self": 49.93664935800044,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.004105511000034312,
	"count": 2,
	"is_parallel": true,
	"self": 0.0015562140000326963,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0025492970000016157,
	"count": 8,
	"is_parallel": true,
	"self": 0.0025492970000016157
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.02470437100001277,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004798270000208049,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0003650399999912679,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003650399999912679
	},
	"communicator.exchange": {
	"total": 0.022389144000015904,
	"count": 1,
	"is_parallel": true,
	"self": 0.022389144000015904
	},
	"steps_from_proto": {
	"total": 0.0014703599999847938,
	"count": 2,
	"is_parallel": true,
	"self": 0.0002902839999592288,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001180076000025565,
	"count": 8,
	"is_parallel": true,
	"self": 0.001180076000025565
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 54.572119164000526,
	"count": 6765,
	"is_parallel": true,
	"self": 3.1604819609981973,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 2.213269317002073,
	"count": 6765,
	"is_parallel": true,
	"self": 2.213269317002073
	},
	"communicator.exchange": {
	"total": 39.91398190599966,
	"count": 6765,
	"is_parallel": true,
	"self": 39.91398190599966
	},
	"steps_from_proto": {
	"total": 9.284385980000593,
	"count": 13530,
	"is_parallel": true,
	"self": 1.8419112900046173,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 7.442474689995976,
	"count": 54120,
	"is_parallel": true,
	"self": 7.442474689995976
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 6.471514165001196,
	"count": 6766,
	"self": 0.7807448480007508,
	"children": {
	"process_trajectory": {
	"total": 5.690769317000445,
	"count": 6766,
	"self": 5.690769317000445
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.8160000081479666e-06,
	"count": 1,
	"self": 1.8160000081479666e-06
	},
	"TrainerController._save_models": {
	"total": 0.16291197600000373,
	"count": 1,
	"self": 0.0012980780000191317,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.1616138979999846,
	"count": 1,
	"self": 0.1616138979999846
	}
	}
	}
	}
	}
	}
	}