{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.30226588249206543, "min": 0.2905525863170624, "max": 0.48415157198905945, "count": 33 }, "Pyramids.Policy.Entropy.sum": { "value": 9043.794921875, "min": 8693.3330078125, "max": 14447.771484375, "count": 33 }, "Pyramids.Step.mean": { "value": 1979893.0, "min": 1019901.0, "max": 1979893.0, "count": 33 }, "Pyramids.Step.sum": { "value": 1979893.0, "min": 1019901.0, "max": 1979893.0, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.6581579446792603, "min": 0.10869690775871277, "max": 0.6835697889328003, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 184.9423828125, "min": 24.538314819335938, "max": 197.91285705566406, "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.05591478571295738, "min": -0.5486251711845398, "max": 0.6454031467437744, "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 15.712055206298828, "min": -149.22604370117188, "max": 179.4220733642578, "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 291.6868686868687, "min": 273.9642857142857, "max": 716.9, "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 28877.0, "min": 15408.0, "max": 32226.0, "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.6867179843783378, "min": 0.5828799590468406, "max": 1.7276306189932265, "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 168.6717984378338, "min": 18.585199385881424, "max": 191.76699870824814, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.6867179843783378, "min": 0.5828799590468406, "max": 1.7276306189932265, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 168.6717984378338, "min": 18.585199385881424, "max": 191.76699870824814, "count": 33 }, "Pyramids.Policy.RndReward.mean": { "value": 0.08323891130188713, "min": 0.07760038152614512, "max": 0.38253927688783734, "count": 33 }, "Pyramids.Policy.RndReward.sum": { "value": 8.323891130188713, "min": 8.065886851632968, "max": 15.301571075513493, "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.030638242301730706, "min": 0.02839826929682334, "max": 0.03363850301996405, "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.4289353922242299, "min": 0.3010105590987951, "max": 0.49610404586419454, "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.01592927757717137, "min": 0.00933230190874181, "max": 0.07634348353991904, "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.22300988608039915, "min": 0.08399071717867629, "max": 1.1451522530987857, "count": 33 }, "Pyramids.Policy.LearningRate.mean": { "value": 5.261262531992852e-06, "min": 5.261262531992852e-06, "max": 0.00014838705053766665, "count": 33 }, "Pyramids.Policy.LearningRate.sum": { "value": 7.365767544789993e-05, "min": 7.365767544789993e-05, "max": 0.0020256206747933498, "count": 33 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10175372142857142, "min": 0.10175372142857142, "max": 0.14946233333333336, "count": 33 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4245520999999999, "min": 1.3451610000000003, "max": 2.11133085, "count": 33 }, "Pyramids.Policy.Beta.mean": { "value": 0.00018519677071428552, "min": 0.00018519677071428552, "max": 0.004951287100000001, "count": 33 }, "Pyramids.Policy.Beta.sum": { "value": 0.0025927547899999973, "min": 0.0025927547899999973, "max": 0.067593144335, "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.027942849323153496, "min": 0.027649715542793274, "max": 0.052572958171367645, "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.39119988679885864, "min": 0.38709601759910583, "max": 0.7247375845909119, "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1675182632", "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn --resume ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1675184765" }, "total": 2133.003628408, "count": 1, "self": 0.4751166099999864, "children": { "run_training.setup": { "total": 0.09911593200013158, "count": 1, "self": 0.09911593200013158 }, "TrainerController.start_learning": { "total": 2132.429395866, "count": 1, "self": 1.1965176899648213, "children": { "TrainerController._reset_env": { "total": 6.112986608000028, "count": 1, "self": 6.112986608000028 }, "TrainerController.advance": { "total": 2125.0332825380347, "count": 64531, "self": 1.3073357259436307, "children": { "env_step": { "total": 1422.273043184955, "count": 64531, "self": 1322.065725131898, "children": { "SubprocessEnvManager._take_step": { "total": 99.47658951301219, "count": 64531, "self": 4.177412174096389, "children": { "TorchPolicy.evaluate": { "total": 95.2991773389158, "count": 62544, "self": 32.42140378492786, "children": { "TorchPolicy.sample_actions": { "total": 62.877773553987936, "count": 62544, "self": 62.877773553987936 } } } } }, "workers": { "total": 0.7307285400447654, "count": 64531, "self": 0.0, "children": { "worker_root": { "total": 2129.417411901921, "count": 64531, "is_parallel": true, "self": 901.1585452369432, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.001725695999994059, "count": 1, "is_parallel": true, "self": 0.0006433660009861342, "children": { "_process_rank_one_or_two_observation": { "total": 0.001082329999007925, "count": 8, "is_parallel": true, "self": 0.001082329999007925 } } }, "UnityEnvironment.step": { "total": 0.04415739600017332, "count": 1, "is_parallel": true, "self": 0.0004756240009555768, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00042504999964876333, "count": 1, "is_parallel": true, "self": 0.00042504999964876333 }, "communicator.exchange": { "total": 0.04169974699971135, "count": 1, "is_parallel": true, "self": 0.04169974699971135 }, "steps_from_proto": { "total": 0.0015569749998576299, "count": 1, "is_parallel": true, "self": 0.00042672600011428585, "children": { "_process_rank_one_or_two_observation": { "total": 0.001130248999743344, "count": 8, "is_parallel": true, "self": 0.001130248999743344 } } } } } } }, "UnityEnvironment.step": { "total": 1228.2588666649776, "count": 64530, "is_parallel": true, "self": 26.56036614386676, "children": { "UnityEnvironment._generate_step_input": { "total": 21.27402726313403, "count": 64530, "is_parallel": true, "self": 21.27402726313403 }, "communicator.exchange": { "total": 1093.3448889038928, "count": 64530, "is_parallel": true, "self": 1093.3448889038928 }, "steps_from_proto": { "total": 87.07958435408409, "count": 64530, "is_parallel": true, "self": 20.499208944890142, "children": { "_process_rank_one_or_two_observation": { "total": 66.58037540919395, "count": 516240, "is_parallel": true, "self": 66.58037540919395 } } } } } } } } } } }, "trainer_advance": { "total": 701.452903627136, "count": 64531, "self": 2.3567661701536053, "children": { "process_trajectory": { "total": 140.65703218398585, "count": 64531, "self": 140.47350847598636, "children": { "RLTrainer._checkpoint": { "total": 0.18352370799948403, "count": 2, "self": 0.18352370799948403 } } }, "_update_policy": { "total": 558.4391052729966, "count": 473, "self": 292.17689421198565, "children": { "TorchPPOOptimizer.update": { "total": 266.26221106101093, "count": 9465, "self": 266.26221106101093 } } } } } } }, "trainer_threads": { "total": 9.080004019779153e-07, "count": 1, "self": 9.080004019779153e-07 }, "TrainerController._save_models": { "total": 0.08660812200014334, "count": 1, "self": 0.0017107240000768797, "children": { "RLTrainer._checkpoint": { "total": 0.08489739800006646, "count": 1, "self": 0.08489739800006646 } } } } } } }