poca-SoccerTwos / run_logs /timers.json
ezrab's picture
First Push
c9b2961 verified
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.9199421405792236,
"min": 1.9163777828216553,
"max": 3.295650005340576,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 38521.71875,
"min": 31440.37109375,
"max": 110100.953125,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 61.775,
"min": 48.584158415841586,
"max": 999.0,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19768.0,
"min": 16436.0,
"max": 23784.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1628.5910647050919,
"min": 1198.5591097434185,
"max": 1628.5910647050919,
"count": 487
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 260574.57035281468,
"min": 2399.3006309080756,
"max": 319455.80218327563,
"count": 487
},
"SoccerTwos.Step.mean": {
"value": 4999847.0,
"min": 9106.0,
"max": 4999847.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 4999847.0,
"min": 9106.0,
"max": 4999847.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.05501215159893036,
"min": -0.0878828912973404,
"max": 0.17502635717391968,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 8.856956481933594,
"min": -12.671778678894043,
"max": 20.595542907714844,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.05289475992321968,
"min": -0.0878741592168808,
"max": 0.18384036421775818,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 8.516056060791016,
"min": -12.723438262939453,
"max": 20.90155029296875,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.14707205236328313,
"min": -0.48869091272354126,
"max": 0.5638300001621246,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 23.678600430488586,
"min": -46.74059993028641,
"max": 61.60879975557327,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.14707205236328313,
"min": -0.48869091272354126,
"max": 0.5638300001621246,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 23.678600430488586,
"min": -46.74059993028641,
"max": 61.60879975557327,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01428732877636018,
"min": 0.010442969878052584,
"max": 0.02359669313300401,
"count": 240
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01428732877636018,
"min": 0.010442969878052584,
"max": 0.02359669313300401,
"count": 240
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.10719360237320265,
"min": 0.00023785107526540136,
"max": 0.11659352357188861,
"count": 240
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.10719360237320265,
"min": 0.00023785107526540136,
"max": 0.11659352357188861,
"count": 240
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10894363522529601,
"min": 0.00023359292827080936,
"max": 0.11885522902011872,
"count": 240
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10894363522529601,
"min": 0.00023359292827080936,
"max": 0.11885522902011872,
"count": 240
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 240
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 240
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 240
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 240
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 240
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 240
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1741958239",
"python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn SoccerTwos.yaml --env=/kaggle/working/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.5.1+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1741968144"
},
"total": 9904.581475075,
"count": 1,
"self": 0.32192011799998,
"children": {
"run_training.setup": {
"total": 0.08083185199984655,
"count": 1,
"self": 0.08083185199984655
},
"TrainerController.start_learning": {
"total": 9904.178723105,
"count": 1,
"self": 6.924276529858616,
"children": {
"TrainerController._reset_env": {
"total": 6.20342662900066,
"count": 25,
"self": 6.20342662900066
},
"TrainerController.advance": {
"total": 9890.869237523139,
"count": 338741,
"self": 7.404843273210645,
"children": {
"env_step": {
"total": 7645.443256884875,
"count": 338741,
"self": 5435.857759721461,
"children": {
"SubprocessEnvManager._take_step": {
"total": 2205.5843031790323,
"count": 338741,
"self": 50.44182486279169,
"children": {
"TorchPolicy.evaluate": {
"total": 2155.1424783162406,
"count": 631900,
"self": 2155.1424783162406
}
}
},
"workers": {
"total": 4.0011939843816435,
"count": 338741,
"self": 0.0,
"children": {
"worker_root": {
"total": 9888.487831582568,
"count": 338741,
"is_parallel": true,
"self": 5347.010806606722,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.003522467000038887,
"count": 2,
"is_parallel": true,
"self": 0.0010157399997297034,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0025067270003091835,
"count": 8,
"is_parallel": true,
"self": 0.0025067270003091835
}
}
},
"UnityEnvironment.step": {
"total": 0.029894303999753902,
"count": 1,
"is_parallel": true,
"self": 0.0007916449994809227,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004639429998860578,
"count": 1,
"is_parallel": true,
"self": 0.0004639429998860578
},
"communicator.exchange": {
"total": 0.026138181000078475,
"count": 1,
"is_parallel": true,
"self": 0.026138181000078475
},
"steps_from_proto": {
"total": 0.002500535000308446,
"count": 2,
"is_parallel": true,
"self": 0.0005926500007262803,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0019078849995821656,
"count": 8,
"is_parallel": true,
"self": 0.0019078849995821656
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 4541.426408038844,
"count": 338740,
"is_parallel": true,
"self": 244.702487298111,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 164.58644384480885,
"count": 338740,
"is_parallel": true,
"self": 164.58644384480885
},
"communicator.exchange": {
"total": 3356.8593818411014,
"count": 338740,
"is_parallel": true,
"self": 3356.8593818411014
},
"steps_from_proto": {
"total": 775.2780950548231,
"count": 677480,
"is_parallel": true,
"self": 144.7892130085702,
"children": {
"_process_rank_one_or_two_observation": {
"total": 630.4888820462529,
"count": 2709920,
"is_parallel": true,
"self": 630.4888820462529
}
}
}
}
},
"steps_from_proto": {
"total": 0.050616937001450424,
"count": 48,
"is_parallel": true,
"self": 0.009881477006274508,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.040735459995175916,
"count": 192,
"is_parallel": true,
"self": 0.040735459995175916
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2238.0211373650536,
"count": 338741,
"self": 60.651900614383976,
"children": {
"process_trajectory": {
"total": 979.8792215666804,
"count": 338741,
"self": 977.9070523826772,
"children": {
"RLTrainer._checkpoint": {
"total": 1.972169184003178,
"count": 10,
"self": 1.972169184003178
}
}
},
"_update_policy": {
"total": 1197.4900151839893,
"count": 240,
"self": 681.5843652289486,
"children": {
"TorchPOCAOptimizer.update": {
"total": 515.9056499550406,
"count": 7200,
"self": 515.9056499550406
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.820014383876696e-07,
"count": 1,
"self": 9.820014383876696e-07
},
"TrainerController._save_models": {
"total": 0.1817814410005667,
"count": 1,
"self": 0.0018027969999820925,
"children": {
"RLTrainer._checkpoint": {
"total": 0.1799786440005846,
"count": 1,
"self": 0.1799786440005846
}
}
}
}
}
}
}