poca-SoccerTwos / run_logs / timers.json
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 3.128203868865967,
"min": 3.128203868865967,
"max": 3.2957658767700195,
"count": 206
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 72374.125,
"min": 1788.0172119140625,
"max": 136265.984375,
"count": 206
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 999.0,
"min": 409.09090909090907,
"max": 999.0,
"count": 206
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19980.0,
"min": 3996.0,
"max": 31704.0,
"count": 206
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1187.140805796752,
"min": 1186.3808015537347,
"max": 1202.2230085734304,
"count": 113
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 2374.281611593504,
"min": 2372.7616031074695,
"max": 12019.077019209795,
"count": 113
},
"SoccerTwos.Step.mean": {
"value": 2059882.0,
"min": 9870.0,
"max": 2059882.0,
"count": 206
},
"SoccerTwos.Step.sum": {
"value": 2059882.0,
"min": 9870.0,
"max": 2059882.0,
"count": 206
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.0022739688865840435,
"min": -0.08057760447263718,
"max": 0.01258127298206091,
"count": 206
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.02273968979716301,
"min": -1.0474029779434204,
"max": 0.13839399814605713,
"count": 206
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.002308222698047757,
"min": -0.08055799454450607,
"max": 0.011082419194281101,
"count": 206
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.023082226514816284,
"min": -1.04714035987854,
"max": 0.12190660834312439,
"count": 206
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 206
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 206
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.0,
"min": -0.42857142857142855,
"max": 0.24627691965836745,
"count": 206
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 0.0,
"min": -6.515599966049194,
"max": 3.201599955558777,
"count": 206
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.0,
"min": -0.42857142857142855,
"max": 0.24627691965836745,
"count": 206
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 0.0,
"min": -6.515599966049194,
"max": 3.201599955558777,
"count": 206
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 206
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 206
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.017127007464296184,
"min": 0.012718712531326067,
"max": 0.02266532371577341,
"count": 95
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.017127007464296184,
"min": 0.012718712531326067,
"max": 0.02266532371577341,
"count": 95
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 2.6337931018360906e-07,
"min": 3.0373415900915764e-08,
"max": 0.0047818772417182725,
"count": 95
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 2.6337931018360906e-07,
"min": 3.0373415900915764e-08,
"max": 0.0047818772417182725,
"count": 95
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 2.3908658306481814e-07,
"min": 4.447467993884402e-08,
"max": 0.004926235570261876,
"count": 95
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 2.3908658306481814e-07,
"min": 4.447467993884402e-08,
"max": 0.004926235570261876,
"count": 95
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 95
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 95
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 95
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 95
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 95
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 95
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1681498125",
"python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:38:11) \n[Clang 14.0.6 ]",
"command_line_arguments": "/Users/mattsthilaire/miniforge3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos-msthil --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0",
"numpy_version": "1.21.2",
"end_time_seconds": "1681506612"
},
"total": 8486.658130917001,
"count": 1,
"self": 0.17415554100080044,
"children": {
"run_training.setup": {
"total": 0.0225070839999999,
"count": 1,
"self": 0.0225070839999999
},
"TrainerController.start_learning": {
"total": 8486.461468292,
"count": 1,
"self": 1.6383473169535137,
"children": {
"TrainerController._reset_env": {
"total": 2.047540998997704,
"count": 11,
"self": 2.047540998997704
},
"TrainerController.advance": {
"total": 8482.65708543405,
"count": 135273,
"self": 1.5377856332906958,
"children": {
"env_step": {
"total": 7091.909376126942,
"count": 135273,
"self": 6852.133794364885,
"children": {
"SubprocessEnvManager._take_step": {
"total": 238.60045398310086,
"count": 135273,
"self": 7.588517586055616,
"children": {
"TorchPolicy.evaluate": {
"total": 231.01193639704525,
"count": 268664,
"self": 231.01193639704525
}
}
},
"workers": {
"total": 1.175127778956595,
"count": 135272,
"self": 0.0,
"children": {
"worker_root": {
"total": 8482.058684237982,
"count": 135272,
"is_parallel": true,
"self": 1874.931821495833,
"children": {
"steps_from_proto": {
"total": 0.018282249998494038,
"count": 22,
"is_parallel": true,
"self": 0.0021257099963478687,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.01615654000214617,
"count": 88,
"is_parallel": true,
"self": 0.01615654000214617
}
}
},
"UnityEnvironment.step": {
"total": 6607.10858049215,
"count": 135272,
"is_parallel": true,
"self": 16.547839282236964,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 114.60310194199081,
"count": 135272,
"is_parallel": true,
"self": 114.60310194199081
},
"communicator.exchange": {
"total": 6235.002833573965,
"count": 135272,
"is_parallel": true,
"self": 6235.002833573965
},
"steps_from_proto": {
"total": 240.95480569395727,
"count": 270544,
"is_parallel": true,
"self": 26.317884138651635,
"children": {
"_process_rank_one_or_two_observation": {
"total": 214.63692155530563,
"count": 1082176,
"is_parallel": true,
"self": 214.63692155530563
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1389.2099236738163,
"count": 135272,
"self": 13.43716021274804,
"children": {
"process_trajectory": {
"total": 209.26003329406998,
"count": 135272,
"self": 208.83696458606923,
"children": {
"RLTrainer._checkpoint": {
"total": 0.4230687080007556,
"count": 4,
"self": 0.4230687080007556
}
}
},
"_update_policy": {
"total": 1166.5127301669984,
"count": 95,
"self": 177.76332381099155,
"children": {
"TorchPOCAOptimizer.update": {
"total": 988.7494063560068,
"count": 2859,
"self": 988.7494063560068
}
}
}
}
}
}
},
"trainer_threads": {
"total": 6.249993020901456e-07,
"count": 1,
"self": 6.249993020901456e-07
},
"TrainerController._save_models": {
"total": 0.11849391699979606,
"count": 1,
"self": 0.0015337090007960796,
"children": {
"RLTrainer._checkpoint": {
"total": 0.11696020799899998,
"count": 1,
"self": 0.11696020799899998
}
}
}
}
}
}
}
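
For convenience, below is a minimal sketch of how a run log like this one could be inspected offline with plain Python. It relies only on the standard-library json module; the run_logs/timers.json path and the helper names (print_gauges, print_timer_tree) are illustrative assumptions, not part of the ML-Agents tooling.

import json
from pathlib import Path

# Assumed location of the log shown above; adjust to wherever mlagents-learn wrote it.
TIMERS_PATH = Path("run_logs/timers.json")


def print_gauges(gauges: dict) -> None:
    """Print each gauge with its latest value, min, max, and sample count."""
    for name, stats in sorted(gauges.items()):
        print(f"{name}: value={stats['value']:.6g} "
              f"(min={stats['min']:.6g}, max={stats['max']:.6g}, count={stats['count']})")


def print_timer_tree(node: dict, name: str = "root", depth: int = 0) -> None:
    """Recursively print the timer hierarchy with total seconds and call counts."""
    indent = "  " * depth
    print(f"{indent}{name}: total={node.get('total', 0.0):.3f}s, count={node.get('count', 0)}")
    for child_name, child in node.get("children", {}).items():
        print_timer_tree(child, child_name, depth + 1)


if __name__ == "__main__":
    data = json.loads(TIMERS_PATH.read_text())
    print_gauges(data.get("gauges", {}))
    print_timer_tree(data)

Running this against the file above would list the SoccerTwos gauges (entropy, ELO, losses, and so on) followed by the timer tree, making it easy to see, for example, that communicator.exchange dominates the wall-clock time of UnityEnvironment.step.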