poca-SoccerTwos / run_logs /timers.json
georgysavva's picture
First Push
47d141b verified
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.9712942838668823,
"min": 1.9661911725997925,
"max": 3.2957358360290527,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 40813.67578125,
"min": 15614.361328125,
"max": 105463.515625,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 60.55555555555556,
"min": 42.293103448275865,
"max": 999.0,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19620.0,
"min": 10788.0,
"max": 30272.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1559.6469771497655,
"min": 1200.7492804441454,
"max": 1577.0405009914823,
"count": 491
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 252662.810298262,
"min": 2401.4985608882907,
"max": 362080.720767181,
"count": 491
},
"SoccerTwos.Step.mean": {
"value": 4999992.0,
"min": 9152.0,
"max": 4999992.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 4999992.0,
"min": 9152.0,
"max": 4999992.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.0013691852800548077,
"min": -0.09895986318588257,
"max": 0.17183257639408112,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.22317719459533691,
"min": -16.72421646118164,
"max": 26.218730926513672,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.00021639192709699273,
"min": -0.09728053957223892,
"max": 0.18304979801177979,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.03527188301086426,
"min": -16.440410614013672,
"max": 27.166671752929688,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.014895704626305703,
"min": -0.42857142857142855,
"max": 0.3610380973134722,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -2.4279998540878296,
"min": -51.80679976940155,
"max": 57.0787992477417,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.014895704626305703,
"min": -0.42857142857142855,
"max": 0.3610380973134722,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -2.4279998540878296,
"min": -51.80679976940155,
"max": 57.0787992477417,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.015365875405647482,
"min": 0.0106980721452904,
"max": 0.023673540592426434,
"count": 240
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.015365875405647482,
"min": 0.0106980721452904,
"max": 0.023673540592426434,
"count": 240
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.09721296106775602,
"min": 0.0001224813905234138,
"max": 0.11625648538271587,
"count": 240
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.09721296106775602,
"min": 0.0001224813905234138,
"max": 0.11625648538271587,
"count": 240
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.09830297008156777,
"min": 0.00012409707390664455,
"max": 0.11816722899675369,
"count": 240
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.09830297008156777,
"min": 0.00012409707390664455,
"max": 0.11816722899675369,
"count": 240
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 240
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 240
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 240
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 240
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 240
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 240
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1719005436",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/home/georgy/miniconda3/envs/hf-rl-course/bin/mlagents-learn ./configs/SoccerTwos.yaml --env=../ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.3.1+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1719012450"
},
"total": 7013.90845661913,
"count": 1,
"self": 0.2687763930298388,
"children": {
"run_training.setup": {
"total": 0.014317912980914116,
"count": 1,
"self": 0.014317912980914116
},
"TrainerController.start_learning": {
"total": 7013.62536231312,
"count": 1,
"self": 5.0036841097753495,
"children": {
"TrainerController._reset_env": {
"total": 1.7660642263945192,
"count": 25,
"self": 1.7660642263945192
},
"TrainerController.advance": {
"total": 7006.711907642661,
"count": 339089,
"self": 4.354088980238885,
"children": {
"env_step": {
"total": 5576.542560391128,
"count": 339089,
"self": 4388.083748762729,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1185.1619284837507,
"count": 339089,
"self": 27.26024706894532,
"children": {
"TorchPolicy.evaluate": {
"total": 1157.9016814148054,
"count": 630752,
"self": 1157.9016814148054
}
}
},
"workers": {
"total": 3.2968831446487457,
"count": 339089,
"self": 0.0,
"children": {
"worker_root": {
"total": 7005.051289109746,
"count": 339089,
"is_parallel": true,
"self": 3254.795083300909,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.003715916071087122,
"count": 2,
"is_parallel": true,
"self": 0.0007357143331319094,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0029802017379552126,
"count": 8,
"is_parallel": true,
"self": 0.0029802017379552126
}
}
},
"UnityEnvironment.step": {
"total": 0.02689134795218706,
"count": 1,
"is_parallel": true,
"self": 0.0008379898499697447,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0006968711968511343,
"count": 1,
"is_parallel": true,
"self": 0.0006968711968511343
},
"communicator.exchange": {
"total": 0.022590431850403547,
"count": 1,
"is_parallel": true,
"self": 0.022590431850403547
},
"steps_from_proto": {
"total": 0.002766055054962635,
"count": 2,
"is_parallel": true,
"self": 0.0004009511321783066,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0023651039227843285,
"count": 8,
"is_parallel": true,
"self": 0.0023651039227843285
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 3750.204459583154,
"count": 339088,
"is_parallel": true,
"self": 238.5870046846103,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 156.512111854041,
"count": 339088,
"is_parallel": true,
"self": 156.512111854041
},
"communicator.exchange": {
"total": 2673.0863169804215,
"count": 339088,
"is_parallel": true,
"self": 2673.0863169804215
},
"steps_from_proto": {
"total": 682.0190260640811,
"count": 678176,
"is_parallel": true,
"self": 108.02852755994536,
"children": {
"_process_rank_one_or_two_observation": {
"total": 573.9904985041358,
"count": 2712704,
"is_parallel": true,
"self": 573.9904985041358
}
}
}
}
},
"steps_from_proto": {
"total": 0.051746225683018565,
"count": 48,
"is_parallel": true,
"self": 0.008203333243727684,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.04354289243929088,
"count": 192,
"is_parallel": true,
"self": 0.04354289243929088
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1425.8152582712937,
"count": 339089,
"self": 44.6332890947815,
"children": {
"process_trajectory": {
"total": 566.3861913965084,
"count": 339089,
"self": 565.0334996974561,
"children": {
"RLTrainer._checkpoint": {
"total": 1.3526916990522295,
"count": 10,
"self": 1.3526916990522295
}
}
},
"_update_policy": {
"total": 814.7957777800038,
"count": 240,
"self": 509.6999193832744,
"children": {
"TorchPOCAOptimizer.update": {
"total": 305.09585839672945,
"count": 7203,
"self": 305.09585839672945
}
}
}
}
}
}
},
"trainer_threads": {
"total": 5.711335688829422e-07,
"count": 1,
"self": 5.711335688829422e-07
},
"TrainerController._save_models": {
"total": 0.14370576315559447,
"count": 1,
"self": 0.0014321389608085155,
"children": {
"RLTrainer._checkpoint": {
"total": 0.14227362419478595,
"count": 1,
"self": 0.14227362419478595
}
}
}
}
}
}
}