{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.14231178164482117, "min": 0.1303008496761322, "max": 1.4535048007965088, "count": 100 }, "Pyramids.Policy.Entropy.sum": { "value": 4305.78515625, "min": 3904.85595703125, "max": 44093.5234375, "count": 100 }, "Pyramids.Step.mean": { "value": 2999904.0, "min": 29926.0, "max": 2999904.0, "count": 100 }, "Pyramids.Step.sum": { "value": 2999904.0, "min": 29926.0, "max": 2999904.0, "count": 100 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.7379971146583557, "min": -0.10925323516130447, "max": 0.8656940460205078, "count": 100 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 221.39913940429688, "min": -26.220775604248047, "max": 260.57391357421875, "count": 100 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.0035940746311098337, "min": -0.029801063239574432, "max": 0.42362481355667114, "count": 100 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 1.078222393989563, "min": -7.718475341796875, "max": 100.39907836914062, "count": 100 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06862654977155908, "min": 0.06414837308090404, "max": 0.07319979948806576, "count": 100 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.9607716968018271, "min": 0.4850072082033081, "max": 1.0779539941771268, "count": 100 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.016393984046137594, "min": 8.172818660874845e-05, "max": 0.01647787087098954, "count": 100 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.22951577664592632, "min": 0.0010624664259137298, "max": 0.2471680630648431, "count": 100 }, "Pyramids.Policy.LearningRate.mean": { "value": 1.568820905664288e-06, "min": 1.568820905664288e-06, "max": 0.0002984113433866952, "count": 100 }, "Pyramids.Policy.LearningRate.sum": { "value": 2.1963492679300033e-05, "min": 2.1963492679300033e-05, "max": 0.004011024262991932, "count": 100 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10052290714285715, "min": 0.10052290714285715, "max": 0.19947044761904764, "count": 100 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4073207, "min": 1.3962931333333335, "max": 2.782517166666666, "count": 100 }, "Pyramids.Policy.Beta.mean": { "value": 6.223842357142869e-05, "min": 6.223842357142869e-05, "max": 0.009947097717142857, "count": 100 }, "Pyramids.Policy.Beta.sum": { "value": 0.0008713379300000016, "min": 0.0008713379300000016, "max": 0.13370710586, "count": 100 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.005444384645670652, "min": 0.005028969142585993, "max": 0.4283823072910309, "count": 100 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.07622138410806656, "min": 0.07040556520223618, "max": 2.998676061630249, "count": 100 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 241.9140625, "min": 206.25, "max": 999.0, "count": 100 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 30965.0, "min": 16725.0, "max": 32953.0, "count": 100 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.7580629770211347, "min": -0.9998194065786177, "max": 1.7795560131681727, "count": 100 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 223.2739980816841, "min": -30.99440160393715, "max": 250.91739785671234, "count": 100 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.7580629770211347, "min": -0.9998194065786177, "max": 1.7795560131681727, "count": 100 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 223.2739980816841, "min": -30.99440160393715, "max": 250.91739785671234, "count": 100 }, "Pyramids.Policy.RndReward.mean": { "value": 0.013571105703439263, "min": 0.011564384719135238, "max": 8.362442617907243, "count": 100 }, "Pyramids.Policy.RndReward.sum": { "value": 1.7235304243367864, "min": 1.5391103338879475, "max": 142.16152450442314, "count": 100 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 100 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 100 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1677656859", "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.22.4", "end_time_seconds": "1677670144" }, "total": 13285.625529079003, "count": 1, "self": 0.940808802999527, "children": { "run_training.setup": { "total": 0.1580522900003416, "count": 1, "self": 0.1580522900003416 }, "TrainerController.start_learning": { "total": 13284.526667986003, "count": 1, "self": 8.513846662179276, "children": { "TrainerController._reset_env": { "total": 6.756042122000508, "count": 1, "self": 6.756042122000508 }, "TrainerController.advance": { "total": 13269.100194726823, "count": 194946, "self": 8.423122134750884, "children": { "env_step": { "total": 9033.157149722825, "count": 194946, "self": 8528.99708593086, "children": { "SubprocessEnvManager._take_step": { "total": 498.81065572308944, "count": 194946, "self": 24.299723959469702, "children": { "TorchPolicy.evaluate": { "total": 474.51093176361974, "count": 187565, "self": 105.17648576021747, "children": { "TorchPolicy.sample_actions": { "total": 369.33444600340226, "count": 187565, "self": 369.33444600340226 } } } } }, "workers": { "total": 5.349408068876073, "count": 194946, "self": 0.0, "children": { "worker_root": { "total": 13256.058694319152, "count": 194946, "is_parallel": true, "self": 5367.6513512620295, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.003673924999020528, "count": 1, "is_parallel": true, "self": 0.0011515779988258146, "children": { "_process_rank_one_or_two_observation": { "total": 0.0025223470001947135, "count": 8, "is_parallel": true, "self": 0.0025223470001947135 } } }, "UnityEnvironment.step": { "total": 0.0707237360002182, "count": 1, "is_parallel": true, "self": 0.0006880049986648373, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0006140100012999028, "count": 1, "is_parallel": true, "self": 0.0006140100012999028 }, "communicator.exchange": { "total": 0.06716437100112671, "count": 1, "is_parallel": true, "self": 0.06716437100112671 }, "steps_from_proto": { "total": 0.0022573499991267454, "count": 1, "is_parallel": true, "self": 0.0005709369979740586, "children": { "_process_rank_one_or_two_observation": { "total": 0.0016864130011526868, "count": 8, "is_parallel": true, "self": 0.0016864130011526868 } } } } } } }, "UnityEnvironment.step": { "total": 7888.4073430571225, "count": 194945, "is_parallel": true, "self": 150.1931942046067, "children": { "UnityEnvironment._generate_step_input": { "total": 92.45847508466613, "count": 194945, "is_parallel": true, "self": 92.45847508466613 }, "communicator.exchange": { "total": 7203.784618341477, "count": 194945, "is_parallel": true, "self": 7203.784618341477 }, "steps_from_proto": { "total": 441.9710554263729, "count": 194945, "is_parallel": true, "self": 114.2965543723476, "children": { "_process_rank_one_or_two_observation": { "total": 327.6745010540253, "count": 1559560, "is_parallel": true, "self": 327.6745010540253 } } } } } } } } } } }, "trainer_advance": { "total": 4227.519922869247, "count": 194946, "self": 17.281063348538737, "children": { "process_trajectory": { "total": 773.5327418526867, "count": 194946, "self": 772.813155588683, "children": { "RLTrainer._checkpoint": { "total": 0.7195862640037376, "count": 6, "self": 0.7195862640037376 } } }, "_update_policy": { "total": 3436.7061176680218, "count": 1398, "self": 895.9034614514167, "children": { "TorchPPOOptimizer.update": { "total": 2540.802656216605, "count": 68358, "self": 2540.802656216605 } } } } } } }, "trainer_threads": { "total": 9.81002813205123e-07, "count": 1, "self": 9.81002813205123e-07 }, "TrainerController._save_models": { "total": 0.1565834939974593, "count": 1, "self": 0.004206261997751426, "children": { "RLTrainer._checkpoint": { "total": 0.15237723199970787, "count": 1, "self": 0.15237723199970787 } } } } } } }