|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.8218531012535095, |
|
"min": 0.8218531012535095, |
|
"max": 1.4017139673233032, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 24787.08984375, |
|
"min": 22427.423828125, |
|
"max": 38343.68359375, |
|
"count": 16 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 479892.0, |
|
"min": 29983.0, |
|
"max": 479892.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 479892.0, |
|
"min": 29983.0, |
|
"max": 479892.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.16719870269298553, |
|
"min": -0.09453507512807846, |
|
"max": 0.18006311357021332, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 41.79967498779297, |
|
"min": -22.499347686767578, |
|
"max": 45.19584274291992, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.04031394422054291, |
|
"min": 0.008605342358350754, |
|
"max": 0.4116668403148651, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 10.078486442565918, |
|
"min": 2.1169142723083496, |
|
"max": 66.13185119628906, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.07071494894710777, |
|
"min": 0.06409087616463414, |
|
"max": 0.07432501029365489, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9900092852595088, |
|
"min": 0.22297503088096465, |
|
"max": 1.0283716070727107, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01113278306284984, |
|
"min": 0.0015895596431628114, |
|
"max": 0.01113278306284984, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.15585896287989776, |
|
"min": 0.008619954277795236, |
|
"max": 0.15585896287989776, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 2.0581250282471426e-05, |
|
"min": 2.0581250282471426e-05, |
|
"max": 0.0002865078044974, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00028813750395459994, |
|
"min": 0.00028813750395459994, |
|
"max": 0.0028506831497724003, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10686038571428572, |
|
"min": 0.10686038571428572, |
|
"max": 0.1955026, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4960454, |
|
"min": 0.5865078, |
|
"max": 2.3381796, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0006953525328571428, |
|
"min": 0.0006953525328571428, |
|
"max": 0.009550709740000001, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.00973493546, |
|
"min": 0.00973493546, |
|
"max": 0.09505773724000002, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.016086162999272346, |
|
"min": 0.015609530732035637, |
|
"max": 0.23164601624011993, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.22520627081394196, |
|
"min": 0.21853342652320862, |
|
"max": 1.1311066150665283, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 658.0909090909091, |
|
"min": 656.1777777777778, |
|
"max": 999.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 28956.0, |
|
"min": 15984.0, |
|
"max": 32536.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 0.7508090504191138, |
|
"min": -1.0000000521540642, |
|
"max": 0.7508090504191138, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 33.03559821844101, |
|
"min": -26.086401507258415, |
|
"max": 33.03559821844101, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 0.7508090504191138, |
|
"min": -1.0000000521540642, |
|
"max": 0.7508090504191138, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 33.03559821844101, |
|
"min": -26.086401507258415, |
|
"max": 33.03559821844101, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.1074948328314349, |
|
"min": 0.10620525570638063, |
|
"max": 2.8118732445515118, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 4.729772644583136, |
|
"min": 4.729772644583136, |
|
"max": 36.554352179169655, |
|
"count": 16 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 16 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1736783484", |
|
"python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", |
|
"mlagents_version": "1.2.0.dev0", |
|
"mlagents_envs_version": "1.2.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.5.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1736784508" |
|
}, |
|
"total": 1024.626133001, |
|
"count": 1, |
|
"self": 0.4771244139999453, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.05486030099996242, |
|
"count": 1, |
|
"self": 0.05486030099996242 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 1024.094148286, |
|
"count": 1, |
|
"self": 0.6168152419968465, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.1712185540000064, |
|
"count": 1, |
|
"self": 2.1712185540000064 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 1021.2239919380033, |
|
"count": 30786, |
|
"self": 0.6336862899715925, |
|
"children": { |
|
"env_step": { |
|
"total": 695.8379171090241, |
|
"count": 30786, |
|
"self": 625.2730052410059, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 70.18478575300469, |
|
"count": 30786, |
|
"self": 2.1632423169855883, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 68.0215434360191, |
|
"count": 30436, |
|
"self": 68.0215434360191 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.3801261150135815, |
|
"count": 30786, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1021.860913875991, |
|
"count": 30786, |
|
"is_parallel": true, |
|
"self": 451.09090727198486, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.00209486099993228, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006973370000196155, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0013975239999126643, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0013975239999126643 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.0452558769998177, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005682189998879039, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0004359550000572199, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004359550000572199 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04256188099998326, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04256188099998326 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0016898219998893182, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0003678539997054031, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0013219680001839151, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0013219680001839151 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 570.7700066040061, |
|
"count": 30785, |
|
"is_parallel": true, |
|
"self": 15.56219973903876, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 11.16187519201435, |
|
"count": 30785, |
|
"is_parallel": true, |
|
"self": 11.16187519201435 |
|
}, |
|
"communicator.exchange": { |
|
"total": 497.36558166495774, |
|
"count": 30785, |
|
"is_parallel": true, |
|
"self": 497.36558166495774 |
|
}, |
|
"steps_from_proto": { |
|
"total": 46.68035000799523, |
|
"count": 30785, |
|
"is_parallel": true, |
|
"self": 9.347248153031842, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 37.33310185496339, |
|
"count": 246280, |
|
"is_parallel": true, |
|
"self": 37.33310185496339 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 324.7523885390076, |
|
"count": 30786, |
|
"self": 1.1181802269559284, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 62.56286166304949, |
|
"count": 30786, |
|
"self": 62.44559191104986, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.11726975199962908, |
|
"count": 1, |
|
"self": 0.11726975199962908 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 261.0713466490022, |
|
"count": 210, |
|
"self": 147.64122675499607, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 113.43011989400611, |
|
"count": 11070, |
|
"self": 113.43011989400611 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.169998520519584e-07, |
|
"count": 1, |
|
"self": 9.169998520519584e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.08212163500002134, |
|
"count": 1, |
|
"self": 0.0020013969997307868, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.08012023800029056, |
|
"count": 1, |
|
"self": 0.08012023800029056 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |