{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.8565446138381958,
"min": 1.8300139904022217,
"max": 3.2036256790161133,
"count": 401
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 34992.15234375,
"min": 32595.626953125,
"max": 102866.40625,
"count": 401
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 80.8360655737705,
"min": 48.53465346534654,
"max": 884.8333333333334,
"count": 401
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19724.0,
"min": 1484.0,
"max": 25944.0,
"count": 401
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1594.5005268827101,
"min": 1199.8062420984254,
"max": 1615.6039021747852,
"count": 401
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 194529.06427969065,
"min": 2408.5595086931794,
"max": 310671.0313586862,
"count": 401
},
"SoccerTwos.Step.mean": {
"value": 4499688.0,
"min": 499928.0,
"max": 4499688.0,
"count": 401
},
"SoccerTwos.Step.sum": {
"value": 4499688.0,
"min": 499928.0,
"max": 4499688.0,
"count": 401
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.007189917378127575,
"min": -0.10055205225944519,
"max": 0.21586117148399353,
"count": 401
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.8771699070930481,
"min": -16.395347595214844,
"max": 29.357118606567383,
"count": 401
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.00981832854449749,
"min": -0.10455340147018433,
"max": 0.22598282992839813,
"count": 401
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -1.1978360414505005,
"min": -16.937650680541992,
"max": 30.733665466308594,
"count": 401
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 401
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 401
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.01649508466486071,
"min": -1.0,
"max": 0.5655735284090042,
"count": 401
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 2.0124003291130066,
"min": -57.84639984369278,
"max": 76.91799986362457,
"count": 401
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.01649508466486071,
"min": -1.0,
"max": 0.5655735284090042,
"count": 401
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 2.0124003291130066,
"min": -57.84639984369278,
"max": 76.91799986362457,
"count": 401
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 401
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 401
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01713785919030973,
"min": 0.010751689630463563,
"max": 0.02467565069285532,
"count": 193
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01713785919030973,
"min": 0.010751689630463563,
"max": 0.02467565069285532,
"count": 193
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.07816493560870488,
"min": 0.001869278926945602,
"max": 0.11182952572902044,
"count": 193
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.07816493560870488,
"min": 0.001869278926945602,
"max": 0.11182952572902044,
"count": 193
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.07915815537174543,
"min": 0.0018843572567372273,
"max": 0.11378700186808904,
"count": 193
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.07915815537174543,
"min": 0.0018843572567372273,
"max": 0.11378700186808904,
"count": 193
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 193
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 193
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 193
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 193
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 193
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 193
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1679669529",
"python_version": "3.9.16 (main, Mar 8 2023, 10:39:24) [MSC v.1916 64 bit (AMD64)]",
"command_line_arguments": "C:\\Users\\joaop\\miniconda3\\envs\\rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.0.0+cpu",
"numpy_version": "1.21.2",
"end_time_seconds": "1679692907"
},
"total": 23378.376714600003,
"count": 1,
"self": 0.8634517000027699,
"children": {
"run_training.setup": {
"total": 0.19488839999999996,
"count": 1,
"self": 0.19488839999999996
},
"TrainerController.start_learning": {
"total": 23377.3183745,
"count": 1,
"self": 10.698057600424363,
"children": {
"TrainerController._reset_env": {
"total": 6.217875199999011,
"count": 21,
"self": 6.217875199999011
},
"TrainerController.advance": {
"total": 23360.136206399577,
"count": 271861,
"self": 10.819512099318672,
"children": {
"env_step": {
"total": 8126.954050799219,
"count": 271861,
"self": 6263.979860599473,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1856.6918990994225,
"count": 271861,
"self": 67.9788764986547,
"children": {
"TorchPolicy.evaluate": {
"total": 1788.7130226007678,
"count": 502870,
"self": 1788.7130226007678
}
}
},
"workers": {
"total": 6.282291100323192,
"count": 271861,
"self": 0.0,
"children": {
"worker_root": {
"total": 23356.25566779996,
"count": 271861,
"is_parallel": true,
"self": 18305.991184700397,
"children": {
"steps_from_proto": {
"total": 0.08139189999524987,
"count": 42,
"is_parallel": true,
"self": 0.016833400005478616,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.06455849998977126,
"count": 168,
"is_parallel": true,
"self": 0.06455849998977126
}
}
},
"UnityEnvironment.step": {
"total": 5050.183091199568,
"count": 271861,
"is_parallel": true,
"self": 272.647700600568,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 244.5002960992781,
"count": 271861,
"is_parallel": true,
"self": 244.5002960992781
},
"communicator.exchange": {
"total": 3645.9851571996655,
"count": 271861,
"is_parallel": true,
"self": 3645.9851571996655
},
"steps_from_proto": {
"total": 887.0499373000555,
"count": 543722,
"is_parallel": true,
"self": 174.81389119825144,
"children": {
"_process_rank_one_or_two_observation": {
"total": 712.236046101804,
"count": 2174888,
"is_parallel": true,
"self": 712.236046101804
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 15222.362643501041,
"count": 271861,
"self": 75.56815480070145,
"children": {
"process_trajectory": {
"total": 2167.6675626003457,
"count": 271861,
"self": 2164.528453300348,
"children": {
"RLTrainer._checkpoint": {
"total": 3.139109299997987,
"count": 9,
"self": 3.139109299997987
}
}
},
"_update_policy": {
"total": 12979.126926099994,
"count": 193,
"self": 1164.9475176999513,
"children": {
"TorchPOCAOptimizer.update": {
"total": 11814.179408400043,
"count": 5790,
"self": 11814.179408400043
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.9999970390927047e-06,
"count": 1,
"self": 1.9999970390927047e-06
},
"TrainerController._save_models": {
"total": 0.2662333000007493,
"count": 1,
"self": 0.017151000000012573,
"children": {
"RLTrainer._checkpoint": {
"total": 0.24908230000073672,
"count": 1,
"self": 0.24908230000073672
}
}
}
}
}
}
}