poca-SoccerTwos-4090 / run_logs /timers.json

First Push

454551a over 1 year ago

20.3 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.12961745262146,
	"min": 2.0128607749938965,
	"max": 3.2957048416137695,
	"count": 500
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 47294.546875,
	"min": 25215.341796875,
	"max": 114234.984375,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 85.3103448275862,
	"min": 65.40789473684211,
	"max": 999.0,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19792.0,
	"min": 9760.0,
	"max": 29316.0,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1385.1089533898953,
	"min": 1195.1336256730665,
	"max": 1421.5866581636521,
	"count": 455
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 160672.63859322786,
	"min": 2392.120072047985,
	"max": 214171.3717349403,
	"count": 455
	},
	"SoccerTwos.Step.mean": {
	"value": 4999996.0,
	"min": 9398.0,
	"max": 4999996.0,
	"count": 500
	},
	"SoccerTwos.Step.sum": {
	"value": 4999996.0,
	"min": 9398.0,
	"max": 4999996.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.01985156163573265,
	"min": -0.16638648509979248,
	"max": 0.19962865114212036,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 2.302781105041504,
	"min": -13.310918807983398,
	"max": 21.16063690185547,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.022537339478731155,
	"min": -0.16885781288146973,
	"max": 0.19671636819839478,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 2.6143314838409424,
	"min": -13.508625030517578,
	"max": 20.8519344329834,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.11248275843159906,
	"min": -0.625,
	"max": 0.4899577435473321,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 13.04799997806549,
	"min": -35.64599967002869,
	"max": 38.842000007629395,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.11248275843159906,
	"min": -0.625,
	"max": 0.4899577435473321,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 13.04799997806549,
	"min": -35.64599967002869,
	"max": 38.842000007629395,
	"count": 500
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.034032461155826844,
	"min": 0.01110359470185358,
	"max": 0.03661396849978094,
	"count": 239
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.034032461155826844,
	"min": 0.01110359470185358,
	"max": 0.03661396849978094,
	"count": 239
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.05795758267243703,
	"min": 9.818604667088948e-06,
	"max": 4.2202854732672375,
	"count": 239
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.05795758267243703,
	"min": 9.818604667088948e-06,
	"max": 4.2202854732672375,
	"count": 239
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.058396623780330024,
	"min": 6.856276786493254e-06,
	"max": 3.7242351276800036,
	"count": 239
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.058396623780330024,
	"min": 6.856276786493254e-06,
	"max": 3.7242351276800036,
	"count": 239
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.003000000000000001,
	"min": 0.0030000000000000005,
	"max": 0.003000000000000001,
	"count": 239
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.003000000000000001,
	"min": 0.0030000000000000005,
	"max": 0.003000000000000001,
	"count": 239
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000004,
	"max": 0.20000000000000007,
	"count": 239
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000004,
	"max": 0.20000000000000007,
	"count": 239
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 239
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 239
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1698455272",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/home/acm/anaconda3/envs/ML-Agents/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos-AI --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu113",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1698459197"
	},
	"total": 3925.1916756709106,
	"count": 1,
	"self": 0.16659858589991927,
	"children": {
	"run_training.setup": {
	"total": 0.004986475920304656,
	"count": 1,
	"self": 0.004986475920304656
	},
	"TrainerController.start_learning": {
	"total": 3925.0200906090904,
	"count": 1,
	"self": 2.2291876182425767,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.799344047671184,
	"count": 25,
	"self": 2.799344047671184
	},
	"TrainerController.advance": {
	"total": 3919.90416892129,
	"count": 330773,
	"self": 2.2556251359637827,
	"children": {
	"env_step": {
	"total": 3191.1467194603756,
	"count": 330773,
	"self": 2677.3377099183854,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 512.3794183228165,
	"count": 330773,
	"self": 17.684439467266202,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 494.6949788555503,
	"count": 634300,
	"self": 494.6949788555503
	}
	}
	},
	"workers": {
	"total": 1.4295912191737443,
	"count": 330773,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3915.8305289507844,
	"count": 330773,
	"is_parallel": true,
	"self": 1587.0276870804373,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0012380797415971756,
	"count": 2,
	"is_parallel": true,
	"self": 0.0002693717833608389,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0009687079582363367,
	"count": 8,
	"is_parallel": true,
	"self": 0.0009687079582363367
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.012806799029931426,
	"count": 1,
	"is_parallel": true,
	"self": 0.0002779781352728605,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00026643695309758186,
	"count": 1,
	"is_parallel": true,
	"self": 0.00026643695309758186
	},
	"communicator.exchange": {
	"total": 0.01133758807554841,
	"count": 1,
	"is_parallel": true,
	"self": 0.01133758807554841
	},
	"steps_from_proto": {
	"total": 0.0009247958660125732,
	"count": 2,
	"is_parallel": true,
	"self": 0.00017542671412229538,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0007493691518902779,
	"count": 8,
	"is_parallel": true,
	"self": 0.0007493691518902779
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2328.770504897693,
	"count": 330772,
	"is_parallel": true,
	"self": 132.92572601302527,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 90.27883003675379,
	"count": 330772,
	"is_parallel": true,
	"self": 90.27883003675379
	},
	"communicator.exchange": {
	"total": 1675.3324669057038,
	"count": 330772,
	"is_parallel": true,
	"self": 1675.3324669057038
	},
	"steps_from_proto": {
	"total": 430.23348194221035,
	"count": 661544,
	"is_parallel": true,
	"self": 69.62733378470875,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 360.6061481575016,
	"count": 2646176,
	"is_parallel": true,
	"self": 360.6061481575016
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.032336972653865814,
	"count": 48,
	"is_parallel": true,
	"self": 0.005629630060866475,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.02670734259299934,
	"count": 192,
	"is_parallel": true,
	"self": 0.02670734259299934
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 726.5018243249506,
	"count": 330773,
	"self": 24.77505039377138,
	"children": {
	"process_trajectory": {
	"total": 230.86068614642136,
	"count": 330773,
	"self": 229.9018766155932,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.9588095308281481,
	"count": 10,
	"self": 0.9588095308281481
	}
	}
	},
	"_update_policy": {
	"total": 470.86608778475784,
	"count": 239,
	"self": 342.3568942944985,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 128.50919349025935,
	"count": 7176,
	"self": 128.50919349025935
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 4.409812390804291e-07,
	"count": 1,
	"self": 4.409812390804291e-07
	},
	"TrainerController._save_models": {
	"total": 0.08738958090543747,
	"count": 1,
	"self": 0.0005776879843324423,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08681189292110503,
	"count": 1,
	"self": 0.08681189292110503
	}
	}
	}
	}
	}
	}
	}