{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 1.517268180847168, "min": 1.4903794527053833, "max": 1.5201311111450195, "count": 3 }, "SoccerTwos.Policy.Entropy.sum": { "value": 29908.390625, "min": 667.6900024414062, "max": 32737.54296875, "count": 3 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 65.22972972972973, "min": 9.0, "max": 65.22972972972973, "count": 3 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19308.0, "min": 72.0, "max": 20136.0, "count": 3 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1210.0421697606719, "min": 1200.4971269630323, "max": 1210.0421697606719, "count": 3 }, "SoccerTwos.Self-play.ELO.sum": { "value": 179086.24112457945, "min": 4801.988507852129, "max": 197767.91558502865, "count": 3 }, "SoccerTwos.Step.mean": { "value": 120019923.0, "min": 119999987.0, "max": 120019923.0, "count": 3 }, "SoccerTwos.Step.sum": { "value": 120019923.0, "min": 119999987.0, "max": 120019923.0, "count": 3 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.008530313149094582, "min": -0.018430374562740326, "max": 0.11498736590147018, "count": 3 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -1.2710167169570923, "min": -3.0225815773010254, "max": 0.22997473180294037, "count": 3 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.009896667674183846, "min": -0.019665079191327095, "max": 0.12343143671751022, "count": 3 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -1.4746034145355225, "min": -3.2250728607177734, "max": 0.24686287343502045, "count": 3 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 3 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 3 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.07723892615145485, "min": 0.07723892615145485, "max": 0.9918000102043152, "count": 3 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 11.508599996566772, "min": 1.9836000204086304, "max": 13.760800123214722, "count": 3 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.07723892615145485, "min": 0.07723892615145485, "max": 0.9918000102043152, "count": 3 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 11.508599996566772, "min": 1.9836000204086304, "max": 13.760800123214722, "count": 3 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 3 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 3 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1679883328", "python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", "command_line_arguments": "/opt/conda/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/linux/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu115", "numpy_version": "1.21.2", "end_time_seconds": "1679883366" }, "total": 38.56977228799997, "count": 1, "self": 0.06740989299987632, "children": { "run_training.setup": { "total": 0.010300079999979062, "count": 1, "self": 0.010300079999979062 }, "TrainerController.start_learning": { "total": 38.49206231500011, "count": 1, "self": 0.033290510006509066, "children": { "TrainerController._reset_env": { "total": 3.5705099850001716, "count": 2, "self": 3.5705099850001716 }, "TrainerController.advance": { "total": 34.735449429993196, "count": 1589, "self": 0.03484026699516107, "children": { "env_step": { "total": 30.001520048000202, "count": 1589, "self": 19.518561332992704, "children": { "SubprocessEnvManager._take_step": { "total": 10.46364094100295, "count": 1589, "self": 0.17991580500051896, "children": { "TorchPolicy.evaluate": { "total": 10.283725136002431, "count": 2892, "self": 10.283725136002431 } } }, "workers": { "total": 0.019317774004548482, "count": 1588, "self": 0.0, "children": { "worker_root": { "total": 38.26803507299769, "count": 1588, "is_parallel": true, "self": 21.78477827799452, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0023607900002389215, "count": 2, "is_parallel": true, "self": 0.0008767130004798673, "children": { "_process_rank_one_or_two_observation": { "total": 0.0014840769997590542, "count": 8, "is_parallel": true, "self": 0.0014840769997590542 } } }, "UnityEnvironment.step": { "total": 0.018528570999933436, "count": 1, "is_parallel": true, "self": 0.00038828300012028194, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00027503499995873426, "count": 1, "is_parallel": true, "self": 0.00027503499995873426 }, "communicator.exchange": { "total": 0.01683400599995366, "count": 1, "is_parallel": true, "self": 0.01683400599995366 }, "steps_from_proto": { "total": 0.001031246999900759, "count": 2, "is_parallel": true, "self": 0.000221451000243178, "children": { "_process_rank_one_or_two_observation": { "total": 0.000809795999657581, "count": 8, "is_parallel": true, "self": 0.000809795999657581 } } } } } } }, "steps_from_proto": { "total": 0.000973369999883289, "count": 2, "is_parallel": true, "self": 0.0001988459996482561, "children": { "_process_rank_one_or_two_observation": { "total": 0.0007745240002350329, "count": 8, "is_parallel": true, "self": 0.0007745240002350329 } } }, "UnityEnvironment.step": { "total": 16.48228342500329, "count": 1587, "is_parallel": true, "self": 0.5538142500083723, "children": { "UnityEnvironment._generate_step_input": { "total": 0.33954139499837765, "count": 1587, "is_parallel": true, "self": 0.33954139499837765 }, "communicator.exchange": { "total": 14.079308392995927, "count": 1587, "is_parallel": true, "self": 14.079308392995927 }, "steps_from_proto": { "total": 1.5096193870006118, "count": 3174, "is_parallel": true, "self": 0.32058106701128963, "children": { "_process_rank_one_or_two_observation": { "total": 1.1890383199893222, "count": 12696, "is_parallel": true, "self": 1.1890383199893222 } } } } } } } } } } }, "trainer_advance": { "total": 4.699089114997832, "count": 1588, "self": 0.21049799600041297, "children": { "process_trajectory": { "total": 4.4885911189974195, "count": 1588, "self": 4.267367384997442, "children": { "RLTrainer._checkpoint": { "total": 0.2212237339999774, "count": 1, "self": 0.2212237339999774 } } } } } } }, "trainer_threads": { "total": 6.75000137562165e-07, "count": 1, "self": 6.75000137562165e-07 }, "TrainerController._save_models": { "total": 0.15281171500009805, "count": 1, "self": 0.0013204310000674013, "children": { "RLTrainer._checkpoint": { "total": 0.15149128400003065, "count": 1, "self": 0.15149128400003065 } } } } } } }