First Push

7d3a00f 11 months ago

15.7 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.5281283855438232,
	"min": 1.51893949508667,
	"max": 3.295815944671631,
	"count": 1518
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 31198.26953125,
	"min": 14103.87109375,
	"max": 130326.140625,
	"count": 1518
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 63.35526315789474,
	"min": 43.846846846846844,
	"max": 999.0,
	"count": 1518
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19260.0,
	"min": 14112.0,
	"max": 26076.0,
	"count": 1518
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1684.6709307184121,
	"min": 1178.148824031623,
	"max": 1684.6709307184121,
	"count": 1451
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 256069.98146919865,
	"min": 2356.297648063246,
	"max": 345320.29804062785,
	"count": 1451
	},
	"SoccerTwos.Step.mean": {
	"value": 15179987.0,
	"min": 9054.0,
	"max": 15179987.0,
	"count": 1518
	},
	"SoccerTwos.Step.sum": {
	"value": 15179987.0,
	"min": 9054.0,
	"max": 15179987.0,
	"count": 1518
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.026739638298749924,
	"min": -0.1436135172843933,
	"max": 0.2555159032344818,
	"count": 1518
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 4.091164588928223,
	"min": -23.983457565307617,
	"max": 30.277732849121094,
	"count": 1518
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.02780262380838394,
	"min": -0.15162380039691925,
	"max": 0.2591020464897156,
	"count": 1518
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 4.253801345825195,
	"min": -25.32117462158203,
	"max": 27.891921997070312,
	"count": 1518
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 1518
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 1518
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.10177124481575162,
	"min": -0.7142857142857143,
	"max": 0.6802690971981395,
	"count": 1518
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 15.571000456809998,
	"min": -61.30559992790222,
	"max": 61.87840008735657,
	"count": 1518
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.10177124481575162,
	"min": -0.7142857142857143,
	"max": 0.6802690971981395,
	"count": 1518
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 15.571000456809998,
	"min": -61.30559992790222,
	"max": 61.87840008735657,
	"count": 1518
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 1518
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 1518
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.022751482788589784,
	"min": 0.01206635746639222,
	"max": 0.028181853886053432,
	"count": 730
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.022751482788589784,
	"min": 0.01206635746639222,
	"max": 0.028181853886053432,
	"count": 730
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.09225530885159969,
	"min": 1.3613655616140364e-07,
	"max": 0.12491751350462436,
	"count": 730
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.09225530885159969,
	"min": 1.3613655616140364e-07,
	"max": 0.12491751350462436,
	"count": 730
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.09491726122796536,
	"min": 1.362520134939871e-07,
	"max": 0.13019061665982007,
	"count": 730
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.09491726122796536,
	"min": 1.362520134939871e-07,
	"max": 0.13019061665982007,
	"count": 730
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.00027864246233939204,
	"min": 0.00027864246233939204,
	"max": 0.00039979000005250007,
	"count": 730
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.00027864246233939204,
	"min": 0.00027864246233939204,
	"max": 0.00039979000005250007,
	"count": 730
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.169660608,
	"min": 0.169660608,
	"max": 0.19994749999999997,
	"count": 730
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.169660608,
	"min": 0.169660608,
	"max": 0.19994749999999997,
	"count": 730
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.0034860643392000006,
	"min": 0.0034860643392000006,
	"max": 0.00499738025,
	"count": 730
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.0034860643392000006,
	"min": 0.0034860643392000006,
	"max": 0.00499738025,
	"count": 730
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1701964854",
	"python_version": "3.10.1 (tags/v3.10.1:2cd268a, Dec 6 2021, 19:10:37) [MSC v.1929 64 bit (AMD64)]",
	"command_line_arguments": "\\\\?\\D:\\backup\\PycharmProjects\\ml-agents\\venv\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.1.1+cpu",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1702027803"
	},
	"total": 62948.622758000005,
	"count": 1,
	"self": 0.819124700006796,
	"children": {
	"run_training.setup": {
	"total": 0.11583329999848502,
	"count": 1,
	"self": 0.11583329999848502
	},
	"TrainerController.start_learning": {
	"total": 62947.6878,
	"count": 1,
	"self": 23.613129600860702,
	"children": {
	"TrainerController._reset_env": {
	"total": 6.999240200027998,
	"count": 76,
	"self": 6.999240200027998
	},
	"TrainerController.advance": {
	"total": 62914.08007509912,
	"count": 1028470,
	"self": 23.77957069518743,
	"children": {
	"env_step": {
	"total": 17688.274200101354,
	"count": 1028470,
	"self": 13484.518638708934,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 4189.176620897037,
	"count": 1028470,
	"self": 126.30452050052918,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 4062.8721003965074,
	"count": 1916096,
	"self": 4062.8721003965074
	}
	}
	},
	"workers": {
	"total": 14.578940495382994,
	"count": 1028469,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 62905.74303450515,
	"count": 1028469,
	"is_parallel": true,
	"self": 51959.60016410397,
	"children": {
	"steps_from_proto": {
	"total": 0.12947239996356075,
	"count": 152,
	"is_parallel": true,
	"self": 0.025777700015169103,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.10369469994839164,
	"count": 608,
	"is_parallel": true,
	"self": 0.10369469994839164
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 10946.013398001214,
	"count": 1028469,
	"is_parallel": true,
	"self": 529.7143207028057,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 417.8714918990627,
	"count": 1028469,
	"is_parallel": true,
	"self": 417.8714918990627
	},
	"communicator.exchange": {
	"total": 8264.872950007,
	"count": 1028469,
	"is_parallel": true,
	"self": 8264.872950007
	},
	"steps_from_proto": {
	"total": 1733.5546353923455,
	"count": 2056938,
	"is_parallel": true,
	"self": 346.06766029520077,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 1387.4869750971448,
	"count": 8227752,
	"is_parallel": true,
	"self": 1387.4869750971448
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 45202.02630430258,
	"count": 1028469,
	"self": 177.75935199018568,
	"children": {
	"process_trajectory": {
	"total": 4369.7174340123565,
	"count": 1028469,
	"self": 4298.999762812375,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 70.71767119998185,
	"count": 30,
	"self": 70.71767119998185
	}
	}
	},
	"_update_policy": {
	"total": 40654.54951830003,
	"count": 730,
	"self": 2319.1410130987933,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 38335.40850520124,
	"count": 29208,
	"self": 38335.40850520124
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.2999953469261527e-06,
	"count": 1,
	"self": 1.2999953469261527e-06
	},
	"TrainerController._save_models": {
	"total": 2.995353799997247,
	"count": 1,
	"self": 0.07506540000031237,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.9202883999969345,
	"count": 1,
	"self": 2.9202883999969345
	}
	}
	}
	}
	}
	}
	}