{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 0.5649459958076477, "min": 0.5644735097885132, "max": 0.572594165802002, "count": 5 }, "SoccerTwos.Policy.Entropy.sum": { "value": 118484.9921875, "min": 84210.671875, "max": 118484.9921875, "count": 5 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 65.57866666666666, "min": 65.45161290322581, "max": 70.0, "count": 5 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 196736.0, "min": 137972.0, "max": 197956.0, "count": 5 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1865.6228489712353, "min": 1845.2267003969812, "max": 1865.6228489712353, "count": 5 }, "SoccerTwos.Self-play.ELO.sum": { "value": 2798434.273456853, "min": 1956507.9199565013, "max": 2798434.273456853, "count": 5 }, "SoccerTwos.Step.mean": { "value": 376899937.0, "min": 376499999.0, "max": 376899937.0, "count": 5 }, "SoccerTwos.Step.sum": { "value": 376899937.0, "min": 376499999.0, "max": 376899937.0, "count": 5 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.019592909142374992, "min": -0.026459304615855217, "max": -0.002913642907515168, "count": 5 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -29.40895652770996, "min": -38.12785720825195, "max": -4.0994954109191895, "count": 5 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.019337261095643044, "min": -0.026621351018548012, "max": -0.003080854658037424, "count": 5 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -29.02522850036621, "min": -38.361366271972656, "max": -4.3347625732421875, "count": 5 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 5 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 5 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": -0.05957335102645498, "min": -0.09744899410245156, "max": 0.00926141178387334, "count": 5 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": -89.41959989070892, "min": -140.4240005016327, "max": 13.512399792671204, "count": 5 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": -0.05957335102645498, "min": -0.09744899410245156, "max": 0.00926141178387334, "count": 5 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": -89.41959989070892, "min": -140.4240005016327, "max": 13.512399792671204, "count": 5 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.01779162102092717, "min": 0.01779162102092717, "max": 0.019526905030620077, "count": 5 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.08895810510463585, "min": 0.05858071509186023, "max": 0.0932162393767309, "count": 5 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.05479174551864465, "min": 0.05327670603990555, "max": 0.056572384966744306, "count": 5 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.27395872759322326, "min": 0.16971715490023292, "max": 0.27395872759322326, "count": 5 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.055094341660539316, "min": 0.05364057421684265, "max": 0.05683861263096333, "count": 5 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.27547170830269657, "min": 0.17051583789289, "max": 0.27547170830269657, "count": 5 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.00012463175680414045, "min": 0.00012463175680414045, "max": 0.00012470578311379397, "count": 5 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0006231587840207023, "min": 0.0003741173493413819, "max": 0.0006234464890768497, "count": 5 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.25, "min": 0.25, "max": 0.25, "count": 5 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 1.25, "min": 0.75, "max": 1.25, "count": 5 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.003119561392044001, "min": 0.003119561392044001, "max": 0.003121408349393334, "count": 5 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.015597806960220005, "min": 0.009364225048180002, "max": 0.015604985204960004, "count": 5 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 5 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 5 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1678655040", "python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]", "command_line_arguments": "/home/jonatan/PycharmProjects/HuggingFaceDLUnit7/venv3.9/bin/mlagents-learn ./config/poca/0046.yaml --env=ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=0046 --num-envs=4 --no-graphics --resume", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.13.0+cu117", "numpy_version": "1.21.2", "end_time_seconds": "1678655366" }, "total": 325.82815397699596, "count": 1, "self": 0.05252380797173828, "children": { "run_training.setup": { "total": 0.04478141001891345, "count": 1, "self": 0.04478141001891345 }, "TrainerController.start_learning": { "total": 325.7308487590053, "count": 1, "self": 0.46060029487125576, "children": { "TrainerController._reset_env": { "total": 1.6848510290146805, "count": 4, "self": 1.6848510290146805 }, "TrainerController.advance": { "total": 323.3811118831509, "count": 22354, "self": 0.3797436287277378, "children": { "env_step": { "total": 175.81198098266032, "count": 22354, "self": 55.943261835956946, "children": { "SubprocessEnvManager._take_step": { "total": 119.59067042183597, "count": 32994, "self": 2.918875542934984, "children": { "TorchPolicy.evaluate": { "total": 116.67179487890098, "count": 60524, "self": 116.67179487890098 } } }, "workers": { "total": 0.2780487248674035, "count": 22354, "self": 0.0, "children": { "worker_root": { "total": 1279.8886924744584, "count": 32986, "is_parallel": true, "self": 912.9872178463847, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0032067029969766736, "count": 2, "is_parallel": true, "self": 0.0006467999191954732, "children": { "_process_rank_one_or_two_observation": { "total": 0.0025599030777812004, "count": 8, "is_parallel": true, "self": 0.0025599030777812004 } } }, "UnityEnvironment.step": { "total": 0.021771005005575716, "count": 1, "is_parallel": true, "self": 0.0006596740568056703, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0006626609829254448, "count": 1, "is_parallel": true, "self": 0.0006626609829254448 }, "communicator.exchange": { "total": 0.018955052946694195, "count": 1, "is_parallel": true, "self": 0.018955052946694195 }, "steps_from_proto": { "total": 0.0014936170191504061, "count": 2, "is_parallel": true, "self": 0.00027803104603663087, "children": { "_process_rank_one_or_two_observation": { "total": 0.0012155859731137753, "count": 8, "is_parallel": true, "self": 0.0012155859731137753 } } } } } } }, "steps_from_proto": { "total": 0.023772606102284044, "count": 24, "is_parallel": true, "self": 0.003904474782757461, "children": { "_process_rank_one_or_two_observation": { "total": 0.019868131319526583, "count": 96, "is_parallel": true, "self": 0.019868131319526583 } } }, "UnityEnvironment.step": { "total": 366.87770202197134, "count": 32985, "is_parallel": true, "self": 24.48025857488392, "children": { "UnityEnvironment._generate_step_input": { "total": 15.887670361611526, "count": 32985, "is_parallel": true, "self": 15.887670361611526 }, "communicator.exchange": { "total": 264.5647421096219, "count": 32985, "is_parallel": true, "self": 264.5647421096219 }, "steps_from_proto": { "total": 61.945030975854024, "count": 65970, "is_parallel": true, "self": 10.734944129711948, "children": { "_process_rank_one_or_two_observation": { "total": 51.210086846142076, "count": 263880, "is_parallel": true, "self": 51.210086846142076 } } } } } } } } } } }, "trainer_advance": { "total": 147.18938727176283, "count": 22354, "self": 4.191262548614759, "children": { "process_trajectory": { "total": 63.20415392232826, "count": 22354, "self": 63.20415392232826 }, "_update_policy": { "total": 79.7939708008198, "count": 23, "self": 55.70710274198791, "children": { "TorchPOCAOptimizer.update": { "total": 24.086868058831897, "count": 690, "self": 24.086868058831897 } } } } } } }, "trainer_threads": { "total": 1.101987436413765e-06, "count": 1, "self": 1.101987436413765e-06 }, "TrainerController._save_models": { "total": 0.20428444998105988, "count": 1, "self": 0.002235173946246505, "children": { "RLTrainer._checkpoint": { "total": 0.20204927603481337, "count": 1, "self": 0.20204927603481337 } } } } } } }