{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.4751316010951996, "min": 0.4751316010951996, "max": 1.4819844961166382, "count": 33 }, "Pyramids.Policy.Entropy.sum": { "value": 14307.1630859375, "min": 14307.1630859375, "max": 44957.48046875, "count": 33 }, "Pyramids.Step.mean": { "value": 989994.0, "min": 29952.0, "max": 989994.0, "count": 33 }, "Pyramids.Step.sum": { "value": 989994.0, "min": 29952.0, "max": 989994.0, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.5144892334938049, "min": -0.09246806055307388, "max": 0.5509904026985168, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 141.4845428466797, "min": -22.28480339050293, "max": 149.869384765625, "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": -0.02455996535718441, "min": -0.02455996535718441, "max": 0.35849425196647644, "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": -6.753990650177002, "min": -6.753990650177002, "max": 84.963134765625, "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06890408480402958, "min": 0.06535967395973362, "max": 0.07486838631687523, "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.9646571872564143, "min": 0.5237277918378153, "max": 1.0463956207580243, "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.014429957925021475, "min": 0.0007994112330046457, "max": 0.017019337494968482, "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.20201941095030065, "min": 0.01119175726206504, "max": 0.23827072492955872, "count": 33 }, "Pyramids.Policy.LearningRate.mean": { "value": 7.566804620621425e-06, "min": 7.566804620621425e-06, "max": 0.00029515063018788575, "count": 33 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.00010593526468869995, "min": 0.00010593526468869995, "max": 0.003507481430839599, "count": 33 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10252223571428572, "min": 0.10252223571428572, "max": 0.19838354285714285, "count": 33 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4353113, "min": 1.3886848, "max": 2.5691604000000003, "count": 33 }, "Pyramids.Policy.Beta.mean": { "value": 0.0002619713478571427, "min": 0.0002619713478571427, "max": 0.00983851593142857, "count": 33 }, "Pyramids.Policy.Beta.sum": { "value": 0.0036675988699999985, "min": 0.0036675988699999985, "max": 0.11693912396000003, "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.012692471034824848, "min": 0.012692471034824848, "max": 0.5196684002876282, "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.17769458889961243, "min": 0.17769458889961243, "max": 3.637678623199463, "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 366.421686746988, "min": 336.13793103448273, "max": 999.0, "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 30413.0, "min": 15984.0, "max": 32666.0, "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.5130746759564044, "min": -1.0000000521540642, "max": 1.6178666439720955, "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 125.58519810438156, "min": -30.69800166785717, "max": 140.7543980255723, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.5130746759564044, "min": -1.0000000521540642, "max": 1.6178666439720955, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 125.58519810438156, "min": -30.69800166785717, "max": 140.7543980255723, "count": 33 }, "Pyramids.Policy.RndReward.mean": { "value": 0.04787124356858752, "min": 0.04468370767527035, "max": 11.574133425951004, "count": 33 }, "Pyramids.Policy.RndReward.sum": { "value": 3.9733132161927642, "min": 3.848675603978336, "max": 185.18613481521606, "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1674142022", "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1674143995" }, "total": 1973.530090246, "count": 1, "self": 0.4473800710004525, "children": { "run_training.setup": { "total": 0.09791745499978788, "count": 1, "self": 0.09791745499978788 }, "TrainerController.start_learning": { "total": 1972.9847927199999, "count": 1, "self": 1.1670493830349642, "children": { "TrainerController._reset_env": { "total": 6.003774200999942, "count": 1, "self": 6.003774200999942 }, "TrainerController.advance": { "total": 1965.727747302965, "count": 63765, "self": 1.2322513640021953, "children": { "env_step": { "total": 1323.9748242129872, "count": 63765, "self": 1222.152015654914, "children": { "SubprocessEnvManager._take_step": { "total": 101.10016689204167, "count": 63765, "self": 4.278429036076432, "children": { "TorchPolicy.evaluate": { "total": 96.82173785596524, "count": 62572, "self": 32.29616380697303, "children": { "TorchPolicy.sample_actions": { "total": 64.52557404899221, "count": 62572, "self": 64.52557404899221 } } } } }, "workers": { "total": 0.7226416660314499, "count": 63765, "self": 0.0, "children": { "worker_root": { "total": 1968.820748304986, "count": 63765, "is_parallel": true, "self": 841.9783478610161, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0016313789999458095, "count": 1, "is_parallel": true, "self": 0.0005775209999683284, "children": { "_process_rank_one_or_two_observation": { "total": 0.001053857999977481, "count": 8, "is_parallel": true, "self": 0.001053857999977481 } } }, "UnityEnvironment.step": { "total": 0.04570511399992938, "count": 1, "is_parallel": true, "self": 0.0004949999997734267, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00048383800003648503, "count": 1, "is_parallel": true, "self": 0.00048383800003648503 }, "communicator.exchange": { "total": 0.04314085000009982, "count": 1, "is_parallel": true, "self": 0.04314085000009982 }, "steps_from_proto": { "total": 0.0015854260000196518, "count": 1, "is_parallel": true, "self": 0.00039267199986170453, "children": { "_process_rank_one_or_two_observation": { "total": 0.0011927540001579473, "count": 8, "is_parallel": true, "self": 0.0011927540001579473 } } } } } } }, "UnityEnvironment.step": { "total": 1126.8424004439698, "count": 63764, "is_parallel": true, "self": 26.959808602015755, "children": { "UnityEnvironment._generate_step_input": { "total": 21.303081727966173, "count": 63764, "is_parallel": true, "self": 21.303081727966173 }, "communicator.exchange": { "total": 983.1699928889716, "count": 63764, "is_parallel": true, "self": 983.1699928889716 }, "steps_from_proto": { "total": 95.40951722501632, "count": 63764, "is_parallel": true, "self": 20.77795456709623, "children": { "_process_rank_one_or_two_observation": { "total": 74.63156265792009, "count": 510112, "is_parallel": true, "self": 74.63156265792009 } } } } } } } } } } }, "trainer_advance": { "total": 640.5206717259757, "count": 63765, "self": 2.2660486160366418, "children": { "process_trajectory": { "total": 139.43531687893164, "count": 63765, "self": 139.25119942393167, "children": { "RLTrainer._checkpoint": { "total": 0.18411745499997778, "count": 2, "self": 0.18411745499997778 } } }, "_update_policy": { "total": 498.81930623100743, "count": 450, "self": 187.4774447769887, "children": { "TorchPPOOptimizer.update": { "total": 311.3418614540187, "count": 22794, "self": 311.3418614540187 } } } } } } }, "trainer_threads": { "total": 8.349998097401112e-07, "count": 1, "self": 8.349998097401112e-07 }, "TrainerController._save_models": { "total": 0.08622099800004435, "count": 1, "self": 0.001500321000094118, "children": { "RLTrainer._checkpoint": { "total": 0.08472067699995023, "count": 1, "self": 0.08472067699995023 } } } } } } }