{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.28290992975234985, "min": 0.15782222151756287, "max": 1.3641231060028076, "count": 43 }, "Pyramids.Policy.Entropy.sum": { "value": 8505.404296875, "min": 4757.39306640625, "max": 41382.0390625, "count": 43 }, "Pyramids.Step.mean": { "value": 1289944.0, "min": 29903.0, "max": 1289944.0, "count": 43 }, "Pyramids.Step.sum": { "value": 1289944.0, "min": 29903.0, "max": 1289944.0, "count": 43 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.5713533759117126, "min": -0.1167815700173378, "max": 0.5713533759117126, "count": 43 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 159.4075927734375, "min": -28.144357681274414, "max": 159.4075927734375, "count": 43 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.060451261699199677, "min": 0.029307974502444267, "max": 0.3584674000740051, "count": 43 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 16.865901947021484, "min": 8.118309020996094, "max": 86.39064025878906, "count": 43 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.07308289039396205, "min": 0.06349791702052159, "max": 0.07387458801572364, "count": 43 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 1.0231604655154687, "min": 0.5712917902329517, "max": 1.1081188202358545, "count": 43 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.0165385166250869, "min": 0.00042530709157215246, "max": 0.0166178956611215, "count": 43 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.23153923275121657, "min": 0.0059542992820101346, "max": 0.24384010157384048, "count": 43 }, "Pyramids.Policy.LearningRate.mean": { "value": 5.869334307324177e-06, "min": 5.869334307324177e-06, "max": 0.00029615457820488455, "count": 43 }, "Pyramids.Policy.LearningRate.sum": { "value": 8.217068030253849e-05, "min": 8.217068030253849e-05, "max": 0.003764050299162769, "count": 43 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10195641208791208, "min": 0.10195641208791208, "max": 0.19871819230769233, "count": 43 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.427389769230769, "min": 1.427389769230769, "max": 2.654683384615385, "count": 43 }, "Pyramids.Policy.Beta.mean": { "value": 0.00020544556758241763, "min": 0.00020544556758241763, "max": 0.009871947411538462, "count": 43 }, "Pyramids.Policy.Beta.sum": { "value": 0.002876237946153847, "min": 0.002876237946153847, "max": 0.1254828701230769, "count": 43 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.04451805353164673, "min": 0.04354657605290413, "max": 0.5241837501525879, "count": 43 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.6232527494430542, "min": 0.609652042388916, "max": 4.193470001220703, "count": 43 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 321.2696629213483, "min": 321.2696629213483, "max": 999.0, "count": 43 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 28593.0, "min": 16190.0, "max": 33407.0, "count": 43 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.6112876254855917, "min": -0.9995533841351668, "max": 1.619279526851394, "count": 43 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 143.40459866821766, "min": -29.986601524055004, "max": 143.40459866821766, "count": 43 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.6112876254855917, "min": -0.9995533841351668, "max": 1.619279526851394, "count": 43 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 143.40459866821766, "min": -29.986601524055004, "max": 143.40459866821766, "count": 43 }, "Pyramids.Policy.RndReward.mean": { "value": 0.14400465802807527, "min": 0.14400465802807527, "max": 10.126450840164633, "count": 43 }, "Pyramids.Policy.RndReward.sum": { "value": 12.8164145644987, "min": 12.8164145644987, "max": 172.14966428279877, "count": 43 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 43 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 43 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1660961446", "python_version": "3.7.13 (default, Apr 24 2022, 01:04:09) \n[GCC 7.5.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./trained-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1660963560" }, "total": 2114.259811897, "count": 1, "self": 0.3213135709997914, "children": { "run_training.setup": { "total": 0.04345352100006039, "count": 1, "self": 0.04345352100006039 }, "TrainerController.start_learning": { "total": 2113.895044805, "count": 1, "self": 1.7680599919908673, "children": { "TrainerController._reset_env": { "total": 5.463571630000047, "count": 1, "self": 5.463571630000047 }, "TrainerController.advance": { "total": 2106.5639303400094, "count": 82942, "self": 1.8261499469672344, "children": { "env_step": { "total": 1230.264099614989, "count": 82942, "self": 1103.0478694140102, "children": { "SubprocessEnvManager._take_step": { "total": 126.27569378999158, "count": 82942, "self": 5.753857396977423, "children": { "TorchPolicy.evaluate": { "total": 120.52183639301415, "count": 81325, "self": 41.321728532932866, "children": { "TorchPolicy.sample_actions": { "total": 79.20010786008129, "count": 81325, "self": 79.20010786008129 } } } } }, "workers": { "total": 0.9405364109871925, "count": 82942, "self": 0.0, "children": { "worker_root": { "total": 2111.1408283789665, "count": 82942, "is_parallel": true, "self": 1125.389301435961, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.005273472999988371, "count": 1, "is_parallel": true, "self": 0.0041152009998768335, "children": { "_process_rank_one_or_two_observation": { "total": 0.0011582720001115376, "count": 8, "is_parallel": true, "self": 0.0011582720001115376 } } }, "UnityEnvironment.step": { "total": 0.032692130000100406, "count": 1, "is_parallel": true, "self": 0.00032922699995197036, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00027252799998223054, "count": 1, "is_parallel": true, "self": 0.00027252799998223054 }, "communicator.exchange": { "total": 0.03103145200009294, "count": 1, "is_parallel": true, "self": 0.03103145200009294 }, "steps_from_proto": { "total": 0.0010589230000732641, "count": 1, "is_parallel": true, "self": 0.0003180750001092747, "children": { "_process_rank_one_or_two_observation": { "total": 0.0007408479999639894, "count": 8, "is_parallel": true, "self": 0.0007408479999639894 } } } } } } }, "UnityEnvironment.step": { "total": 985.7515269430055, "count": 82941, "is_parallel": true, "self": 22.0653133079702, "children": { "UnityEnvironment._generate_step_input": { "total": 16.780598970038113, "count": 82941, "is_parallel": true, "self": 16.780598970038113 }, "communicator.exchange": { "total": 871.0220757840096, "count": 82941, "is_parallel": true, "self": 871.0220757840096 }, "steps_from_proto": { "total": 75.88353888098754, "count": 82941, "is_parallel": true, "self": 20.24116092800466, "children": { "_process_rank_one_or_two_observation": { "total": 55.64237795298288, "count": 663528, "is_parallel": true, "self": 55.64237795298288 } } } } } } } } } } }, "trainer_advance": { "total": 874.4736807780532, "count": 82942, "self": 3.3104847330450866, "children": { "process_trajectory": { "total": 203.60261897200985, "count": 82942, "self": 203.40802821600937, "children": { "RLTrainer._checkpoint": { "total": 0.19459075600047981, "count": 2, "self": 0.19459075600047981 } } }, "_update_policy": { "total": 667.5605770729983, "count": 598, "self": 263.961000961977, "children": { "TorchPPOOptimizer.update": { "total": 403.5995761110213, "count": 29607, "self": 403.5995761110213 } } } } } } }, "trainer_threads": { "total": 1.1140000424347818e-06, "count": 1, "self": 1.1140000424347818e-06 }, "TrainerController._save_models": { "total": 0.09948172899976271, "count": 1, "self": 0.0014616369999203016, "children": { "RLTrainer._checkpoint": { "total": 0.09802009199984241, "count": 1, "self": 0.09802009199984241 } } } } } } }