{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.7464560270309448, "min": 0.7464560270309448, "max": 1.4029273986816406, "count": 16 }, "Pyramids.Policy.Entropy.sum": { "value": 22405.625, "min": 22405.625, "max": 42559.20703125, "count": 16 }, "Pyramids.Step.mean": { "value": 479986.0, "min": 29952.0, "max": 479986.0, "count": 16 }, "Pyramids.Step.sum": { "value": 479986.0, "min": 29952.0, "max": 479986.0, "count": 16 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": -0.007536211516708136, "min": -0.08861368149518967, "max": 0.028692930936813354, "count": 16 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": -1.8539080619812012, "min": -21.267284393310547, "max": 7.0584611892700195, "count": 16 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.023149048909544945, "min": 0.023149048909544945, "max": 0.266669899225235, "count": 16 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 5.694665908813477, "min": 5.694665908813477, "max": 63.200767517089844, "count": 16 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06964277009787372, "min": 0.06656558413778985, "max": 0.07596241547337088, "count": 16 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.974998781370232, "min": 0.4851144522407772, "max": 0.9991759692419174, "count": 16 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.0028964160404766084, "min": 0.0008843073084158285, "max": 0.005411580702630522, "count": 16 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.04054982456667252, "min": 0.0067436495732724954, "max": 0.07576212983682731, "count": 16 }, "Pyramids.Policy.LearningRate.mean": { "value": 2.1303650041671426e-05, "min": 2.1303650041671426e-05, "max": 0.00029030126037577137, "count": 16 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.0002982511005834, "min": 0.0002982511005834, "max": 0.0026349669216778, "count": 16 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10710118571428572, "min": 0.10710118571428572, "max": 0.19676708571428575, "count": 16 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4994166, "min": 1.3382272, "max": 2.2550920000000003, "count": 16 }, "Pyramids.Policy.Beta.mean": { "value": 0.000719408452857143, "min": 0.000719408452857143, "max": 0.00967703186285714, "count": 16 }, "Pyramids.Policy.Beta.sum": { "value": 0.010071718340000002, "min": 0.010071718340000002, "max": 0.08786438778000001, "count": 16 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.019943514838814735, "min": 0.019943514838814735, "max": 0.3411950170993805, "count": 16 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.2792091965675354, "min": 0.2792091965675354, "max": 2.3883650302886963, "count": 16 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 921.8285714285714, "min": 844.2727272727273, "max": 999.0, "count": 16 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 32264.0, "min": 15984.0, "max": 32328.0, "count": 16 }, "Pyramids.Environment.CumulativeReward.mean": { "value": -0.29362862088850566, "min": -1.0000000521540642, "max": -0.1173758041678053, "count": 16 }, "Pyramids.Environment.CumulativeReward.sum": { "value": -10.277001731097698, "min": -32.000001668930054, "max": -3.8734015375375748, "count": 16 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": -0.29362862088850566, "min": -1.0000000521540642, "max": -0.1173758041678053, "count": 16 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": -10.277001731097698, "min": -32.000001668930054, "max": -3.8734015375375748, "count": 16 }, "Pyramids.Policy.RndReward.mean": { "value": 0.19050542868073014, "min": 0.18536401506174693, "max": 6.625431148335338, "count": 16 }, "Pyramids.Policy.RndReward.sum": { "value": 6.667690003825555, "min": 6.117012497037649, "max": 106.0068983733654, "count": 16 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 16 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 16 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1674682032", "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./trained-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --force", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1674682986" }, "total": 953.1708651980001, "count": 1, "self": 0.43987947400023586, "children": { "run_training.setup": { "total": 0.10250952900003085, "count": 1, "self": 0.10250952900003085 }, "TrainerController.start_learning": { "total": 952.6284761949998, "count": 1, "self": 0.5830455149725822, "children": { "TrainerController._reset_env": { "total": 5.932209274000002, "count": 1, "self": 5.932209274000002 }, "TrainerController.advance": { "total": 946.0236782040273, "count": 31569, "self": 0.6459622010434032, "children": { "env_step": { "total": 624.9368654209877, "count": 31569, "self": 572.6706140259781, "children": { "SubprocessEnvManager._take_step": { "total": 51.89972149500454, "count": 31569, "self": 2.1489310709976053, "children": { "TorchPolicy.evaluate": { "total": 49.75079042400694, "count": 31319, "self": 16.940194671001336, "children": { "TorchPolicy.sample_actions": { "total": 32.8105957530056, "count": 31319, "self": 32.8105957530056 } } } } }, "workers": { "total": 0.36652990000504815, "count": 31569, "self": 0.0, "children": { "worker_root": { "total": 950.2774944440102, "count": 31569, "is_parallel": true, "self": 427.69851899902267, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0018109750000121494, "count": 1, "is_parallel": true, "self": 0.0006856730001345568, "children": { "_process_rank_one_or_two_observation": { "total": 0.0011253019998775926, "count": 8, "is_parallel": true, "self": 0.0011253019998775926 } } }, "UnityEnvironment.step": { "total": 0.04688734499995917, "count": 1, "is_parallel": true, "self": 0.0004948399998738751, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00044313099999726546, "count": 1, "is_parallel": true, "self": 0.00044313099999726546 }, "communicator.exchange": { "total": 0.044324056000050405, "count": 1, "is_parallel": true, "self": 0.044324056000050405 }, "steps_from_proto": { "total": 0.0016253180000376233, "count": 1, "is_parallel": true, "self": 0.0004613410001184093, "children": { "_process_rank_one_or_two_observation": { "total": 0.001163976999919214, "count": 8, "is_parallel": true, "self": 0.001163976999919214 } } } } } } }, "UnityEnvironment.step": { "total": 522.5789754449876, "count": 31568, "is_parallel": true, "self": 13.71885985996687, "children": { "UnityEnvironment._generate_step_input": { "total": 11.229444884006512, "count": 31568, "is_parallel": true, "self": 11.229444884006512 }, "communicator.exchange": { "total": 447.429475485005, "count": 31568, "is_parallel": true, "self": 447.429475485005 }, "steps_from_proto": { "total": 50.20119521600918, "count": 31568, "is_parallel": true, "self": 10.971166037053763, "children": { "_process_rank_one_or_two_observation": { "total": 39.23002917895542, "count": 252544, "is_parallel": true, "self": 39.23002917895542 } } } } } } } } } } }, "trainer_advance": { "total": 320.4408505819962, "count": 31569, "self": 0.9624543269923151, "children": { "process_trajectory": { "total": 72.21191473900467, "count": 31569, "self": 72.11116764900476, "children": { "RLTrainer._checkpoint": { "total": 0.10074708999991344, "count": 1, "self": 0.10074708999991344 } } }, "_update_policy": { "total": 247.2664815159992, "count": 205, "self": 91.97091399598617, "children": { "TorchPPOOptimizer.update": { "total": 155.29556752001304, "count": 11454, "self": 155.29556752001304 } } } } } } }, "trainer_threads": { "total": 1.032999989547534e-06, "count": 1, "self": 1.032999989547534e-06 }, "TrainerController._save_models": { "total": 0.08954216899996936, "count": 1, "self": 0.0017235380000784062, "children": { "RLTrainer._checkpoint": { "total": 0.08781863099989096, "count": 1, "self": 0.08781863099989096 } } } } } } }