{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 1.542044997215271, "min": 1.440100073814392, "max": 1.6137632131576538, "count": 300 }, "SoccerTwos.Policy.Entropy.sum": { "value": 32814.71875, "min": 25896.232421875, "max": 35227.22265625, "count": 300 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 58.80952380952381, "min": 44.72477064220183, "max": 86.49122807017544, "count": 300 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19760.0, "min": 18724.0, "max": 20772.0, "count": 300 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1653.1870649019568, "min": 1567.552494060283, "max": 1655.0609915835641, "count": 300 }, "SoccerTwos.Self-play.ELO.sum": { "value": 277735.42690352874, "min": 185288.5933308388, "max": 353285.91771309637, "count": 300 }, "SoccerTwos.Step.mean": { "value": 14999930.0, "min": 12009982.0, "max": 14999930.0, "count": 300 }, "SoccerTwos.Step.sum": { "value": 14999930.0, "min": 12009982.0, "max": 14999930.0, "count": 300 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.04682938754558563, "min": -0.11298096179962158, "max": 0.093830406665802, "count": 300 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -7.820508003234863, "min": -17.991260528564453, "max": 17.358625411987305, "count": 300 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.04404613748192787, "min": -0.10972505807876587, "max": 0.09695275872945786, "count": 300 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -7.3557047843933105, "min": -17.871688842773438, "max": 17.936260223388672, "count": 300 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 300 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 300 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": -0.12098922201259407, "min": -0.2797437529079616, "max": 0.27960924881731153, "count": 300 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": -20.20520007610321, "min": -46.605599999427795, "max": 48.3724000453949, "count": 300 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": -0.12098922201259407, "min": -0.2797437529079616, "max": 0.27960924881731153, "count": 300 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": -20.20520007610321, "min": -46.605599999427795, "max": 48.3724000453949, "count": 300 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 300 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 300 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.016679967249122758, "min": 0.013073392383133372, "max": 0.024770521942991765, "count": 145 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.016679967249122758, "min": 0.013073392383133372, "max": 0.024770521942991765, "count": 145 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.10101278101404508, "min": 0.08707024628917376, "max": 0.11337359274427096, "count": 145 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.10101278101404508, "min": 0.08707024628917376, "max": 0.11337359274427096, "count": 145 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.10257193421324094, "min": 0.08828358178337416, "max": 0.11552387624979019, "count": 145 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.10257193421324094, "min": 0.08828358178337416, "max": 0.11552387624979019, "count": 145 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 145 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 145 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 145 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 145 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 145 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 145 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1675923540", "python_version": "3.9.16 (main, Feb 6 2023, 20:06:40) \n[GCC 9.3.0]", "command_line_arguments": "/usr/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1675935835" }, "total": 12295.671090400021, "count": 1, "self": 0.32222739997087047, "children": { "run_training.setup": { "total": 0.047608000051695853, "count": 1, "self": 0.047608000051695853 }, "TrainerController.start_learning": { "total": 12295.301254999998, "count": 1, "self": 7.271457104652654, "children": { "TrainerController._reset_env": { "total": 1.7654651998891495, "count": 16, "self": 1.7654651998891495 }, "TrainerController.advance": { "total": 12285.502733295492, "count": 207000, "self": 7.892098882293794, "children": { "env_step": { "total": 6744.709322719427, "count": 207000, "self": 5854.004936416459, "children": { "SubprocessEnvManager._take_step": { "total": 886.3216951006325, "count": 207000, "self": 38.47987049946096, "children": { "TorchPolicy.evaluate": { "total": 847.8418246011715, "count": 376556, "self": 847.8418246011715 } } }, "workers": { "total": 4.382691202335991, "count": 207000, "self": 0.0, "children": { "worker_root": { "total": 12277.59570988745, "count": 207000, "is_parallel": true, "self": 7156.613118898065, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.004712300025857985, "count": 2, "is_parallel": true, "self": 0.0014410000294446945, "children": { "_process_rank_one_or_two_observation": { "total": 0.0032712999964132905, "count": 8, "is_parallel": true, "self": 0.0032712999964132905 } } }, "UnityEnvironment.step": { "total": 0.059866299969144166, "count": 1, "is_parallel": true, "self": 0.0009093000553548336, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0013091000146232545, "count": 1, "is_parallel": true, "self": 0.0013091000146232545 }, "communicator.exchange": { "total": 0.055025899957399815, "count": 1, "is_parallel": true, "self": 0.055025899957399815 }, "steps_from_proto": { "total": 0.002621999941766262, "count": 2, "is_parallel": true, "self": 0.000580199935939163, "children": { "_process_rank_one_or_two_observation": { "total": 0.002041800005827099, "count": 8, "is_parallel": true, "self": 0.002041800005827099 } } } } } } }, "steps_from_proto": { "total": 0.034881899948231876, "count": 30, "is_parallel": true, "self": 0.007476300408598036, "children": { "_process_rank_one_or_two_observation": { "total": 0.02740559953963384, "count": 120, "is_parallel": true, "self": 0.02740559953963384 } } }, "UnityEnvironment.step": { "total": 5120.947709089436, "count": 206999, "is_parallel": true, "self": 169.77864146704087, "children": { "UnityEnvironment._generate_step_input": { "total": 129.137426803587, "count": 206999, "is_parallel": true, "self": 129.137426803587 }, "communicator.exchange": { "total": 4308.419570893282, "count": 206999, "is_parallel": true, "self": 4308.419570893282 }, "steps_from_proto": { "total": 513.6120699255262, "count": 413998, "is_parallel": true, "self": 112.80534110986628, "children": { "_process_rank_one_or_two_observation": { "total": 400.8067288156599, "count": 1655992, "is_parallel": true, "self": 400.8067288156599 } } } } } } } } } } }, "trainer_advance": { "total": 5532.901311693771, "count": 207000, "self": 41.952493078657426, "children": { "process_trajectory": { "total": 997.4942364149028, "count": 207000, "self": 996.1923424148699, "children": { "RLTrainer._checkpoint": { "total": 1.3018940000329167, "count": 6, "self": 1.3018940000329167 } } }, "_update_policy": { "total": 4493.454582200211, "count": 145, "self": 565.9212106984342, "children": { "TorchPOCAOptimizer.update": { "total": 3927.533371501777, "count": 4350, "self": 3927.533371501777 } } } } } } }, "trainer_threads": { "total": 1.9999570213258266e-06, "count": 1, "self": 1.9999570213258266e-06 }, "TrainerController._save_models": { "total": 0.7615974000073038, "count": 1, "self": 0.0016035999869927764, "children": { "RLTrainer._checkpoint": { "total": 0.759993800020311, "count": 1, "self": 0.759993800020311 } } } } } } }