{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 0.866117000579834, "min": 0.8086401224136353, "max": 2.135493516921997, "count": 14989 }, "SoccerTwos.Policy.Entropy.sum": { "value": 18708.126953125, "min": 10466.740234375, "max": 105615.1484375, "count": 14989 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 66.29166666666667, "min": 26.98324022346369, "max": 125.325, "count": 14989 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19092.0, "min": 14712.0, "max": 22936.0, "count": 14989 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1707.7936415009024, "min": 1549.168502889312, "max": 1746.4515803198233, "count": 14989 }, "SoccerTwos.Self-play.ELO.sum": { "value": 245922.28437612994, "min": 120430.73786124286, "max": 605872.0984318862, "count": 14989 }, "SoccerTwos.Step.mean": { "value": 199999964.0, "min": 50119986.0, "max": 199999964.0, "count": 14989 }, "SoccerTwos.Step.sum": { "value": 199999964.0, "min": 50119986.0, "max": 199999964.0, "count": 14989 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.04558149352669716, "min": -0.16296879947185516, "max": 0.10279054194688797, "count": 14989 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -6.700479507446289, "min": -33.77891540527344, "max": 16.427635192871094, "count": 14989 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.04524017497897148, "min": -0.16307416558265686, "max": 0.10262896120548248, "count": 14989 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -6.65030574798584, "min": -34.11742401123047, "max": 16.870479583740234, "count": 14989 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 14989 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 14989 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": -0.17092517241328753, "min": -0.47276239211742693, "max": 0.5691900824712328, "count": 14989 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": -25.126000344753265, "min": -87.17599999904633, "max": 83.58380001783371, "count": 14989 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": -0.17092517241328753, "min": -0.47276239211742693, "max": 0.5691900824712328, "count": 14989 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": -25.126000344753265, "min": -87.17599999904633, "max": 83.58380001783371, "count": 14989 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 14989 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 14989 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.018238363913648453, "min": 0.008571711436282688, "max": 0.026601446373388172, "count": 7245 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.018238363913648453, "min": 0.008571711436282688, "max": 0.026601446373388172, "count": 7245 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.09880388751626015, "min": 0.06719134338200092, "max": 0.15229609956343967, "count": 7245 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.09880388751626015, "min": 0.06719134338200092, "max": 0.15229609956343967, "count": 7245 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.09918721541762351, "min": 0.06746410404642424, "max": 0.15259439150492352, "count": 7245 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.09918721541762351, "min": 0.06746410404642424, "max": 0.15259439150492352, "count": 7245 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 6.048997025493988e-09, "min": 6.048997025493988e-09, "max": 0.0001498667620666315, "count": 7245 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 6.048997025493988e-09, "min": 6.048997025493988e-09, "max": 0.0001498667620666315, "count": 7245 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 7245 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 7245 }, "SoccerTwos.Policy.Beta.mean": { "value": 1.0297152549999698e-05, "min": 1.0297152549999698e-05, "max": 0.00749584351315, "count": 7245 }, "SoccerTwos.Policy.Beta.sum": { "value": 1.0297152549999698e-05, "min": 1.0297152549999698e-05, "max": 0.00749584351315, "count": 7245 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1681458589", "python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", "command_line_arguments": "/data/qyh/env/ml-agents/bin/mlagents-learn ./results/configuration.yaml", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1681660711" }, "total": 202121.95327740815, "count": 1, "self": 0.7371731949970126, "children": { "run_training.setup": { "total": 0.08580901497043669, "count": 1, "self": 0.08580901497043669 }, "TrainerController.start_learning": { "total": 202121.13029519818, "count": 1, "self": 75.58960591861978, "children": { "TrainerController._reset_env": { "total": 239.88585016061552, "count": 750, "self": 239.88585016061552 }, "TrainerController.advance": { "total": 201805.20052092662, "count": 889082, "self": 43.436931712087244, "children": { "env_step": { "total": 109403.14526834106, "count": 889082, "self": 35718.75220445846, "children": { "SubprocessEnvManager._take_step": { "total": 73588.09211776033, "count": 11064486, "self": 1956.4829019042663, "children": { "TorchPolicy.evaluate": { "total": 71631.60921585606, "count": 20304662, "self": 71631.60921585606 } } }, "workers": { "total": 96.30094612226821, "count": 889082, "self": 0.0, "children": { "worker_root": { "total": 3786373.531351197, "count": 11061955, "is_parallel": true, "self": 3543006.6518733725, "children": { "run_training.setup": { "total": 1.372944239526987, "count": 16, "is_parallel": true, "self": 0.8564431574195623, "children": { "steps_from_proto": { "total": 0.05167464469559491, "count": 20, "is_parallel": true, "self": 0.012508621672168374, "children": { "_process_rank_one_or_two_observation": { "total": 0.03916602302342653, "count": 80, "is_parallel": true, "self": 0.03916602302342653 } } }, "UnityEnvironment.step": { "total": 0.46482643741182983, "count": 10, "is_parallel": true, "self": 0.012752049136906862, "children": { "UnityEnvironment._generate_step_input": { "total": 0.009736666223034263, "count": 10, "is_parallel": true, "self": 0.009736666223034263 }, "communicator.exchange": { "total": 0.4049945876467973, "count": 10, "is_parallel": true, "self": 0.4049945876467973 }, "steps_from_proto": { "total": 0.037343134405091405, "count": 20, "is_parallel": true, "self": 0.007720504887402058, "children": { "_process_rank_one_or_two_observation": { "total": 0.029622629517689347, "count": 80, "is_parallel": true, "self": 0.029622629517689347 } } } } } } }, "steps_from_proto": { "total": 63.20921622682363, "count": 23968, "is_parallel": true, "self": 10.96054931380786, "children": { "_process_rank_one_or_two_observation": { "total": 52.24866691301577, "count": 95872, "is_parallel": true, "self": 52.24866691301577 } } }, "UnityEnvironment.step": { "total": 243302.29731735843, "count": 11061929, "is_parallel": true, "self": 16865.871614304837, "children": { "UnityEnvironment._generate_step_input": { "total": 10229.591617493192, "count": 11061929, "is_parallel": true, "self": 10229.591617493192 }, "communicator.exchange": { "total": 170588.07838961575, "count": 11061929, "is_parallel": true, "self": 170588.07838961575 }, "steps_from_proto": { "total": 45618.75569594465, "count": 22123858, "is_parallel": true, "self": 8546.25141385477, "children": { "_process_rank_one_or_two_observation": { "total": 37072.50428208988, "count": 88495432, "is_parallel": true, "self": 37072.50428208988 } } } } }, "TrainerController.start_learning": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "TrainerController._reset_env": { "total": 765.6606953628361, "count": 2576, "is_parallel": true, "self": 765.6606953628361 }, "TrainerController.advance": { "total": 553472.6433439851, "count": 3113472, "is_parallel": true, "self": 127.54399403184652, "children": { "env_step": { "total": 312836.9059403762, "count": 3113472, "is_parallel": true, "self": 104029.15610423265, "children": { "SubprocessEnvManager._take_step": { "total": 208505.66601867974, "count": 37653456, "is_parallel": true, "self": 5868.197185412049, "children": { "TorchPolicy.evaluate": { "total": 202637.4688332677, "count": 69410080, "is_parallel": true, "self": 202637.4688332677 } } }, "workers": { "total": 301.0074671693146, "count": 3113472, "is_parallel": true, "self": 0.0, "children": { "worker_root": { "total": 8863163.5911063, "count": 37643536, "is_parallel": true, "self": 8047015.4603802115, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.8267943151295185, "count": 320, "is_parallel": true, "self": 0.20013794675469398, "children": { "_process_rank_one_or_two_observation": { "total": 0.6266563683748245, "count": 1280, "is_parallel": true, "self": 0.6266563683748245 } } }, "UnityEnvironment.step": { "total": 7.437222998589277, "count": 160, "is_parallel": true, "self": 0.2040327861905098, "children": { "UnityEnvironment._generate_step_input": { "total": 0.1557866595685482, "count": 160, "is_parallel": true, "self": 0.1557866595685482 }, "communicator.exchange": { "total": 6.479913402348757, "count": 160, "is_parallel": true, "self": 6.479913402348757 }, "steps_from_proto": { "total": 0.5974901504814625, "count": 320, "is_parallel": true, "self": 0.12352807819843292, "children": { "_process_rank_one_or_two_observation": { "total": 0.47396207228302956, "count": 1280, "is_parallel": true, "self": 0.47396207228302956 } } } } } } }, "steps_from_proto": { "total": 189.85917573422194, "count": 81920, "is_parallel": true, "self": 32.98321542516351, "children": { "_process_rank_one_or_two_observation": { "total": 156.87596030905843, "count": 327680, "is_parallel": true, "self": 156.87596030905843 } } }, "UnityEnvironment.step": { "total": 815958.2715503536, "count": 37643376, "is_parallel": true, "self": 50899.1951662004, "children": { "UnityEnvironment._generate_step_input": { "total": 34107.74587376788, "count": 37643376, "is_parallel": true, "self": 34107.74587376788 }, "communicator.exchange": { "total": 584456.3526424319, "count": 37643376, "is_parallel": true, "self": 584456.3526424319 }, "steps_from_proto": { "total": 146494.97786795348, "count": 75286752, "is_parallel": true, "self": 28645.180666983128, "children": { "_process_rank_one_or_two_observation": { "total": 117849.79720097035, "count": 301147008, "is_parallel": true, "self": 117849.79720097035 } } } } } } } } }, "steps_from_proto": { "total": 0.13184957904741168, "count": 32, "is_parallel": true, "self": 0.023764571640640497, "children": { "_process_rank_one_or_two_observation": { "total": 0.10808500740677118, "count": 128, "is_parallel": true, "self": 0.10808500740677118 } } }, "UnityEnvironment.step": { "total": 0.9445007154718041, "count": 16, "is_parallel": true, "self": 0.08671622956171632, "children": { "UnityEnvironment._generate_step_input": { "total": 0.033300156239420176, "count": 16, "is_parallel": true, "self": 0.033300156239420176 }, "communicator.exchange": { "total": 0.6965830507688224, "count": 16, "is_parallel": true, "self": 0.6965830507688224 }, "steps_from_proto": { "total": 0.12790127890184522, "count": 32, "is_parallel": true, "self": 0.016938731539994478, "children": { "_process_rank_one_or_two_observation": { "total": 0.11096254736185074, "count": 128, "is_parallel": true, "self": 0.11096254736185074 } } } } } } }, "trainer_advance": { "total": 240508.193409577, "count": 3113472, "is_parallel": true, "self": 4416.851860079914, "children": { "process_trajectory": { "total": 98595.71652773768, "count": 3113472, "is_parallel": true, "self": 98254.31838959828, "children": { "RLTrainer._checkpoint": { "total": 341.3981381393969, "count": 1008, "is_parallel": true, "self": 341.3981381393969 } } }, "_update_policy": { "total": 137495.62502175942, "count": 24656, "is_parallel": true, "self": 92660.20954589918, "children": { "TorchPOCAOptimizer.update": { "total": 44835.41547586024, "count": 739680, "is_parallel": true, "self": 44835.41547586024 } } } } } } } } } } } } } } }, "trainer_advance": { "total": 92358.61832087347, "count": 889082, "self": 1729.3800815341529, "children": { "process_trajectory": { "total": 39200.872351852246, "count": 889082, "self": 39080.471363719786, "children": { "RLTrainer._checkpoint": { "total": 120.40098813246004, "count": 300, "self": 120.40098813246004 } } }, "_update_policy": { "total": 51428.365887487074, "count": 7245, "self": 35151.995161822764, "children": { "TorchPOCAOptimizer.update": { "total": 16276.37072566431, "count": 217350, "self": 16276.37072566431 } } } } } } }, "trainer_threads": { "total": 1.4849938452243805e-06, "count": 1, "self": 1.4849938452243805e-06 }, "TrainerController._save_models": { "total": 0.4543167073279619, "count": 1, "self": 0.0035243132151663303, "children": { "RLTrainer._checkpoint": { "total": 0.4507923941127956, "count": 1, "self": 0.4507923941127956 } } } } } } }