{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.5240244269371033, "min": 0.5240244269371033, "max": 1.5604443550109863, "count": 33 }, "Pyramids.Policy.Entropy.sum": { "value": 15603.3505859375, "min": 15603.3505859375, "max": 49934.21875, "count": 33 }, "Pyramids.Step.mean": { "value": 989827.0, "min": 29912.0, "max": 989827.0, "count": 33 }, "Pyramids.Step.sum": { "value": 989827.0, "min": 29912.0, "max": 989827.0, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.47195708751678467, "min": -0.11839296668767929, "max": 0.5243668556213379, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 73.15335083007812, "min": -14.088763236999512, "max": 79.17939758300781, "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.034837398678064346, "min": 0.014649661257863045, "max": 0.41853392124176025, "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 5.399796962738037, "min": 2.0949015617370605, "max": 49.805538177490234, "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.04392328329101604, "min": 0.04392328329101604, "max": 0.05385815075984552, "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.3074629830371123, "min": 0.16157445227953657, "max": 0.4029338099547507, "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.017007534372775506, "min": 0.001628449542701528, "max": 0.019308498711325228, "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.11905274060942854, "min": 0.011399146798910695, "max": 0.1351594909792766, "count": 33 }, "Pyramids.Policy.LearningRate.mean": { "value": 7.620140317128576e-06, "min": 7.620140317128576e-06, "max": 0.00029516160161279994, "count": 33 }, "Pyramids.Policy.LearningRate.sum": { "value": 5.334098221990003e-05, "min": 5.334098221990003e-05, "max": 0.0018782307739230995, "count": 33 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10254001428571431, "min": 0.10254001428571431, "max": 0.19838719999999999, "count": 33 }, "Pyramids.Policy.Epsilon.sum": { "value": 0.7177801000000001, "min": 0.5951616, "max": 1.3260769000000001, "count": 33 }, "Pyramids.Policy.Beta.mean": { "value": 0.0002637474271428573, "min": 0.0002637474271428573, "max": 0.009838881280000001, "count": 33 }, "Pyramids.Policy.Beta.sum": { "value": 0.0018462319900000013, "min": 0.0018462319900000013, "max": 0.06261508231, "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.017371272668242455, "min": 0.01701119728386402, "max": 0.7396652102470398, "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.12159890681505203, "min": 0.1190783753991127, "max": 2.2189955711364746, "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 385.2987012987013, "min": 348.7011494252874, "max": 999.0, "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 29668.0, "min": 17236.0, "max": 33706.0, "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.5107844003609248, "min": -1.0000000596046448, "max": 1.5876545325502174, "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 116.33039882779121, "min": -27.664801836013794, "max": 135.34819811582565, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.5107844003609248, "min": -1.0000000596046448, "max": 1.5876545325502174, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 116.33039882779121, "min": -27.664801836013794, "max": 135.34819811582565, "count": 33 }, "Pyramids.Policy.RndReward.mean": { "value": 0.06773548879261528, "min": 0.06295230909584804, "max": 11.090575384057086, "count": 33 }, "Pyramids.Policy.RndReward.sum": { "value": 5.215632637031376, "min": 4.847327800380299, "max": 255.083233833313, "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1674368628", "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1674370414" }, "total": 1785.822968471, "count": 1, "self": 0.47895825499995226, "children": { "run_training.setup": { "total": 0.09914366099997096, "count": 1, "self": 0.09914366099997096 }, "TrainerController.start_learning": { "total": 1785.244866555, "count": 1, "self": 1.1131324259840767, "children": { "TrainerController._reset_env": { "total": 6.06497550600011, "count": 1, "self": 6.06497550600011 }, "TrainerController.advance": { "total": 1777.9846226120155, "count": 63720, "self": 1.146976587987865, "children": { "env_step": { "total": 1249.3115349429675, "count": 63720, "self": 1150.9779937049723, "children": { "SubprocessEnvManager._take_step": { "total": 97.62427970501813, "count": 63720, "self": 4.068538166007329, "children": { "TorchPolicy.evaluate": { "total": 93.5557415390108, "count": 62590, "self": 31.474505881949653, "children": { "TorchPolicy.sample_actions": { "total": 62.08123565706114, "count": 62590, "self": 62.08123565706114 } } } } }, "workers": { "total": 0.7092615329770524, "count": 63720, "self": 0.0, "children": { "worker_root": { "total": 1781.4459608130917, "count": 63720, "is_parallel": true, "self": 720.5651224371013, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.001775920000000042, "count": 1, "is_parallel": true, "self": 0.0006120049999935873, "children": { "_process_rank_one_or_two_observation": { "total": 0.0011639150000064546, "count": 8, "is_parallel": true, "self": 0.0011639150000064546 } } }, "UnityEnvironment.step": { "total": 0.04738303699991775, "count": 1, "is_parallel": true, "self": 0.0004737369999929797, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00042197099992336007, "count": 1, "is_parallel": true, "self": 0.00042197099992336007 }, "communicator.exchange": { "total": 0.0447465419999844, "count": 1, "is_parallel": true, "self": 0.0447465419999844 }, "steps_from_proto": { "total": 0.0017407870000170078, "count": 1, "is_parallel": true, "self": 0.0004731369999717572, "children": { "_process_rank_one_or_two_observation": { "total": 0.0012676500000452506, "count": 8, "is_parallel": true, "self": 0.0012676500000452506 } } } } } } }, "UnityEnvironment.step": { "total": 1060.8808383759904, "count": 63719, "is_parallel": true, "self": 26.506139344005533, "children": { "UnityEnvironment._generate_step_input": { "total": 20.98834946001216, "count": 63719, "is_parallel": true, "self": 20.98834946001216 }, "communicator.exchange": { "total": 918.392368103008, "count": 63719, "is_parallel": true, "self": 918.392368103008 }, "steps_from_proto": { "total": 94.99398146896465, "count": 63719, "is_parallel": true, "self": 20.362303769981963, "children": { "_process_rank_one_or_two_observation": { "total": 74.63167769898268, "count": 509752, "is_parallel": true, "self": 74.63167769898268 } } } } } } } } } } }, "trainer_advance": { "total": 527.5261110810602, "count": 63720, "self": 2.2673867050991703, "children": { "process_trajectory": { "total": 125.55169884495604, "count": 63720, "self": 125.36900244295589, "children": { "RLTrainer._checkpoint": { "total": 0.18269640200014692, "count": 2, "self": 0.18269640200014692 } } }, "_update_policy": { "total": 399.707025531005, "count": 228, "self": 188.07272992402272, "children": { "TorchPPOOptimizer.update": { "total": 211.63429560698228, "count": 11385, "self": 211.63429560698228 } } } } } } }, "trainer_threads": { "total": 7.430003279296216e-07, "count": 1, "self": 7.430003279296216e-07 }, "TrainerController._save_models": { "total": 0.08213526800000182, "count": 1, "self": 0.0013929020001341996, "children": { "RLTrainer._checkpoint": { "total": 0.08074236599986762, "count": 1, "self": 0.08074236599986762 } } } } } } }