First Push

c9b2961 verified 9 days ago

20.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.9199421405792236,
	"min": 1.9163777828216553,
	"max": 3.295650005340576,
	"count": 500
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 38521.71875,
	"min": 31440.37109375,
	"max": 110100.953125,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 61.775,
	"min": 48.584158415841586,
	"max": 999.0,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19768.0,
	"min": 16436.0,
	"max": 23784.0,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1628.5910647050919,
	"min": 1198.5591097434185,
	"max": 1628.5910647050919,
	"count": 487
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 260574.57035281468,
	"min": 2399.3006309080756,
	"max": 319455.80218327563,
	"count": 487
	},
	"SoccerTwos.Step.mean": {
	"value": 4999847.0,
	"min": 9106.0,
	"max": 4999847.0,
	"count": 500
	},
	"SoccerTwos.Step.sum": {
	"value": 4999847.0,
	"min": 9106.0,
	"max": 4999847.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.05501215159893036,
	"min": -0.0878828912973404,
	"max": 0.17502635717391968,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 8.856956481933594,
	"min": -12.671778678894043,
	"max": 20.595542907714844,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.05289475992321968,
	"min": -0.0878741592168808,
	"max": 0.18384036421775818,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 8.516056060791016,
	"min": -12.723438262939453,
	"max": 20.90155029296875,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.14707205236328313,
	"min": -0.48869091272354126,
	"max": 0.5638300001621246,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 23.678600430488586,
	"min": -46.74059993028641,
	"max": 61.60879975557327,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.14707205236328313,
	"min": -0.48869091272354126,
	"max": 0.5638300001621246,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 23.678600430488586,
	"min": -46.74059993028641,
	"max": 61.60879975557327,
	"count": 500
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01428732877636018,
	"min": 0.010442969878052584,
	"max": 0.02359669313300401,
	"count": 240
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01428732877636018,
	"min": 0.010442969878052584,
	"max": 0.02359669313300401,
	"count": 240
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10719360237320265,
	"min": 0.00023785107526540136,
	"max": 0.11659352357188861,
	"count": 240
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10719360237320265,
	"min": 0.00023785107526540136,
	"max": 0.11659352357188861,
	"count": 240
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10894363522529601,
	"min": 0.00023359292827080936,
	"max": 0.11885522902011872,
	"count": 240
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10894363522529601,
	"min": 0.00023359292827080936,
	"max": 0.11885522902011872,
	"count": 240
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 240
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 240
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 240
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 240
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 240
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 240
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1741958239",
	"python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn SoccerTwos.yaml --env=/kaggle/working/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.5.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1741968144"
	},
	"total": 9904.581475075,
	"count": 1,
	"self": 0.32192011799998,
	"children": {
	"run_training.setup": {
	"total": 0.08083185199984655,
	"count": 1,
	"self": 0.08083185199984655
	},
	"TrainerController.start_learning": {
	"total": 9904.178723105,
	"count": 1,
	"self": 6.924276529858616,
	"children": {
	"TrainerController._reset_env": {
	"total": 6.20342662900066,
	"count": 25,
	"self": 6.20342662900066
	},
	"TrainerController.advance": {
	"total": 9890.869237523139,
	"count": 338741,
	"self": 7.404843273210645,
	"children": {
	"env_step": {
	"total": 7645.443256884875,
	"count": 338741,
	"self": 5435.857759721461,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 2205.5843031790323,
	"count": 338741,
	"self": 50.44182486279169,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 2155.1424783162406,
	"count": 631900,
	"self": 2155.1424783162406
	}
	}
	},
	"workers": {
	"total": 4.0011939843816435,
	"count": 338741,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 9888.487831582568,
	"count": 338741,
	"is_parallel": true,
	"self": 5347.010806606722,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.003522467000038887,
	"count": 2,
	"is_parallel": true,
	"self": 0.0010157399997297034,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0025067270003091835,
	"count": 8,
	"is_parallel": true,
	"self": 0.0025067270003091835
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.029894303999753902,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007916449994809227,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004639429998860578,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004639429998860578
	},
	"communicator.exchange": {
	"total": 0.026138181000078475,
	"count": 1,
	"is_parallel": true,
	"self": 0.026138181000078475
	},
	"steps_from_proto": {
	"total": 0.002500535000308446,
	"count": 2,
	"is_parallel": true,
	"self": 0.0005926500007262803,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0019078849995821656,
	"count": 8,
	"is_parallel": true,
	"self": 0.0019078849995821656
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 4541.426408038844,
	"count": 338740,
	"is_parallel": true,
	"self": 244.702487298111,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 164.58644384480885,
	"count": 338740,
	"is_parallel": true,
	"self": 164.58644384480885
	},
	"communicator.exchange": {
	"total": 3356.8593818411014,
	"count": 338740,
	"is_parallel": true,
	"self": 3356.8593818411014
	},
	"steps_from_proto": {
	"total": 775.2780950548231,
	"count": 677480,
	"is_parallel": true,
	"self": 144.7892130085702,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 630.4888820462529,
	"count": 2709920,
	"is_parallel": true,
	"self": 630.4888820462529
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.050616937001450424,
	"count": 48,
	"is_parallel": true,
	"self": 0.009881477006274508,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.040735459995175916,
	"count": 192,
	"is_parallel": true,
	"self": 0.040735459995175916
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 2238.0211373650536,
	"count": 338741,
	"self": 60.651900614383976,
	"children": {
	"process_trajectory": {
	"total": 979.8792215666804,
	"count": 338741,
	"self": 977.9070523826772,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.972169184003178,
	"count": 10,
	"self": 1.972169184003178
	}
	}
	},
	"_update_policy": {
	"total": 1197.4900151839893,
	"count": 240,
	"self": 681.5843652289486,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 515.9056499550406,
	"count": 7200,
	"self": 515.9056499550406
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.820014383876696e-07,
	"count": 1,
	"self": 9.820014383876696e-07
	},
	"TrainerController._save_models": {
	"total": 0.1817814410005667,
	"count": 1,
	"self": 0.0018027969999820925,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.1799786440005846,
	"count": 1,
	"self": 0.1799786440005846
	}
	}
	}
	}
	}
	}
	}