{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 3.1573421955108643, "min": 3.1193549633026123, "max": 3.2956697940826416, "count": 204 }, "SoccerTwos.Policy.Entropy.sum": { "value": 91537.6640625, "min": 22145.384765625, "max": 113804.59375, "count": 204 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 740.2857142857143, "min": 471.5, "max": 999.0, "count": 204 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 20728.0, "min": 13260.0, "max": 28076.0, "count": 204 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1196.044530811736, "min": 1194.5995997367977, "max": 1215.4939278097893, "count": 159 }, "SoccerTwos.Self-play.ELO.sum": { "value": 9568.356246493888, "min": 2389.1991994735954, "max": 14396.330814613222, "count": 159 }, "SoccerTwos.Step.mean": { "value": 2039646.0, "min": 9054.0, "max": 2039646.0, "count": 204 }, "SoccerTwos.Step.sum": { "value": 2039646.0, "min": 9054.0, "max": 2039646.0, "count": 204 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": 0.013888576999306679, "min": -0.013252537697553635, "max": 0.05611197650432587, "count": 204 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": 0.1944400817155838, "min": -0.2175348848104477, "max": 0.8977916240692139, "count": 204 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": 0.014462905004620552, "min": -0.012911916710436344, "max": 0.056133802980184555, "count": 204 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": 0.20248067378997803, "min": -0.21378286182880402, "max": 0.8981384038925171, "count": 204 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 204 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 204 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.019714287349155972, "min": -0.5625, "max": 0.34826666514078775, "count": 204 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 0.2760000228881836, "min": -9.0, "max": 5.359999984502792, "count": 204 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.019714287349155972, "min": -0.5625, "max": 0.34826666514078775, "count": 204 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 0.2760000228881836, "min": -9.0, "max": 5.359999984502792, "count": 204 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 204 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 204 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.016578856820706277, "min": 0.0104911725250228, "max": 0.023848259889443096, "count": 95 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.016578856820706277, "min": 0.0104911725250228, "max": 0.023848259889443096, "count": 95 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.004163745751914878, "min": 2.5253433932448386e-06, "max": 0.0048438915982842445, "count": 95 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.004163745751914878, "min": 2.5253433932448386e-06, "max": 0.0048438915982842445, "count": 95 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.004275392834097147, "min": 2.5751679269584807e-06, "max": 0.004879755914832155, "count": 95 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.004275392834097147, "min": 2.5751679269584807e-06, "max": 0.004879755914832155, "count": 95 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 95 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 95 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 95 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 95 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 95 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 95 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1678549238", "python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", "command_line_arguments": "/home/fer/miniconda3/envs/rl/bin/mlagents-learn ./SoccerTwos.yaml --env=./SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu113", "numpy_version": "1.21.2", "end_time_seconds": "1678551788" }, "total": 2549.631119179001, "count": 1, "self": 0.052769633000934846, "children": { "run_training.setup": { "total": 0.007245131999297882, "count": 1, "self": 0.007245131999297882 }, "TrainerController.start_learning": { "total": 2549.5711044140007, "count": 1, "self": 2.7172993279000366, "children": { "TrainerController._reset_env": { "total": 4.349112961001083, "count": 11, "self": 4.349112961001083 }, "TrainerController.advance": { "total": 2542.3395385041003, "count": 133268, "self": 3.1790522586106817, "children": { "env_step": { "total": 1984.838998668829, "count": 133268, "self": 1421.5724086424852, "children": { "SubprocessEnvManager._take_step": { "total": 561.4521566224412, "count": 133268, "self": 15.476844517868813, "children": { "TorchPolicy.evaluate": { "total": 545.9753121045724, "count": 264599, "self": 545.9753121045724 } } }, "workers": { "total": 1.8144334039025125, "count": 133267, "self": 0.0, "children": { "worker_root": { "total": 2545.490670408546, "count": 133267, "is_parallel": true, "self": 1425.9446901018728, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.001545119999718736, "count": 2, "is_parallel": true, "self": 0.0004526110005826922, "children": { "_process_rank_one_or_two_observation": { "total": 0.0010925089991360437, "count": 8, "is_parallel": true, "self": 0.0010925089991360437 } } }, "UnityEnvironment.step": { "total": 0.019817124000837794, "count": 1, "is_parallel": true, "self": 0.0004965509997418849, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00046378200022445526, "count": 1, "is_parallel": true, "self": 0.00046378200022445526 }, "communicator.exchange": { "total": 0.01740983200033952, "count": 1, "is_parallel": true, "self": 0.01740983200033952 }, "steps_from_proto": { "total": 0.0014469590005319333, "count": 2, "is_parallel": true, "self": 0.0002938880024885293, "children": { "_process_rank_one_or_two_observation": { "total": 0.001153070998043404, "count": 8, "is_parallel": true, "self": 0.001153070998043404 } } } } } } }, "UnityEnvironment.step": { "total": 1119.531721983678, "count": 133266, "is_parallel": true, "self": 68.2219598996544, "children": { "UnityEnvironment._generate_step_input": { "total": 47.15250782205294, "count": 133266, "is_parallel": true, "self": 47.15250782205294 }, "communicator.exchange": { "total": 810.4720720318765, "count": 133266, "is_parallel": true, "self": 810.4720720318765 }, "steps_from_proto": { "total": 193.68518223009414, "count": 266532, "is_parallel": true, "self": 37.63077084696488, "children": { "_process_rank_one_or_two_observation": { "total": 156.05441138312926, "count": 1066128, "is_parallel": true, "self": 156.05441138312926 } } } } }, "steps_from_proto": { "total": 0.014258322995374328, "count": 20, "is_parallel": true, "self": 0.0028566979963216, "children": { "_process_rank_one_or_two_observation": { "total": 0.011401624999052729, "count": 80, "is_parallel": true, "self": 0.011401624999052729 } } } } } } } } }, "trainer_advance": { "total": 554.3214875766607, "count": 133267, "self": 24.025186708360707, "children": { "process_trajectory": { "total": 149.61244848931165, "count": 133267, "self": 148.90445992631066, "children": { "RLTrainer._checkpoint": { "total": 0.7079885630009812, "count": 4, "self": 0.7079885630009812 } } }, "_update_policy": { "total": 380.6838523789884, "count": 95, "self": 218.16326152800502, "children": { "TorchPOCAOptimizer.update": { "total": 162.52059085098335, "count": 2850, "self": 162.52059085098335 } } } } } } }, "trainer_threads": { "total": 8.319984772242606e-07, "count": 1, "self": 8.319984772242606e-07 }, "TrainerController._save_models": { "total": 0.16515278900078556, "count": 1, "self": 0.0012243510009284364, "children": { "RLTrainer._checkpoint": { "total": 0.16392843799985712, "count": 1, "self": 0.16392843799985712 } } } } } } }