|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.48702165484428406, |
|
"min": 0.44668611884117126, |
|
"max": 1.5974081754684448, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 7293.63623046875, |
|
"min": 6742.52392578125, |
|
"max": 25558.53125, |
|
"count": 100 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 1499927.0, |
|
"min": 14960.0, |
|
"max": 1499927.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 1499927.0, |
|
"min": 14960.0, |
|
"max": 1499927.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.1931789666414261, |
|
"min": -0.08827703446149826, |
|
"max": 0.54588782787323, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 24.147371292114258, |
|
"min": -10.593244552612305, |
|
"max": 71.51130676269531, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.10692010819911957, |
|
"min": -2.319406270980835, |
|
"max": 0.5430359244346619, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 13.365013122558594, |
|
"min": -313.1198425292969, |
|
"max": 72.2237777709961, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.021887752918216086, |
|
"min": 0.016317666446169218, |
|
"max": 0.03001637246925384, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.06566325875464826, |
|
"min": 0.04895299933850765, |
|
"max": 0.1022449663025327, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.028128571606551606, |
|
"min": 0.0004217532914481126, |
|
"max": 0.5521492043510079, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.08438571481965482, |
|
"min": 0.0012652598743443377, |
|
"max": 2.2085968174040316, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 1.1040105591555517e-06, |
|
"min": 1.1040105591555517e-06, |
|
"max": 0.00019877120061440002, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 3.3120316774666553e-06, |
|
"min": 3.3120316774666553e-06, |
|
"max": 0.0007798576100711998, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10055195555555556, |
|
"min": 0.10055195555555556, |
|
"max": 0.1993856, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 0.30165586666666666, |
|
"min": 0.30165586666666666, |
|
"max": 0.7899288, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 6.514035999999981e-05, |
|
"min": 6.514035999999981e-05, |
|
"max": 0.00993862144, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.00019542107999999945, |
|
"min": 0.00019542107999999945, |
|
"max": 0.03899388712000001, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.01588110625743866, |
|
"min": 0.015369528904557228, |
|
"max": 0.8264577984809875, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.04764331877231598, |
|
"min": 0.04751599207520485, |
|
"max": 1.652915596961975, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 605.9090909090909, |
|
"min": 358.6363636363636, |
|
"max": 999.0, |
|
"count": 99 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 13330.0, |
|
"min": 7480.0, |
|
"max": 18408.0, |
|
"count": 99 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.0303272245959803, |
|
"min": -1.0000000521540642, |
|
"max": 1.6413636089048602, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 22.667198941111565, |
|
"min": -15.999400839209557, |
|
"max": 72.21999879181385, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.0303272245959803, |
|
"min": -1.0000000521540642, |
|
"max": 1.6413636089048602, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 22.667198941111565, |
|
"min": -15.999400839209557, |
|
"max": 72.21999879181385, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.09671802150974558, |
|
"min": 0.07045210495099044, |
|
"max": 11.204274728894234, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.127796473214403, |
|
"min": 2.127796473214403, |
|
"max": 104.2868239581585, |
|
"count": 100 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1679323052", |
|
"python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training 3 --no-graphics", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1679326214" |
|
}, |
|
"total": 3162.679552165, |
|
"count": 1, |
|
"self": 0.44162624799992045, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.10628935299996556, |
|
"count": 1, |
|
"self": 0.10628935299996556 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 3162.131636564, |
|
"count": 1, |
|
"self": 2.04367966191694, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 10.231304194000018, |
|
"count": 1, |
|
"self": 10.231304194000018 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 3149.743723493083, |
|
"count": 95475, |
|
"self": 2.1986011099693314, |
|
"children": { |
|
"env_step": { |
|
"total": 2213.671983656081, |
|
"count": 95475, |
|
"self": 2052.434392665081, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 160.00268999499417, |
|
"count": 95475, |
|
"self": 6.980408748963498, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 153.02228124603067, |
|
"count": 93823, |
|
"self": 153.02228124603067 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 1.2349009960059334, |
|
"count": 95475, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 3155.096824597045, |
|
"count": 95475, |
|
"is_parallel": true, |
|
"self": 1275.8812516060202, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.00515687000000753, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0036788550000323994, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0014780149999751302, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0014780149999751302 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.0757186139999817, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005660490000423124, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00046223299995062916, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00046223299995062916 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.07301252199999908, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.07301252199999908 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0016778099999896767, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004385029999980361, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0012393069999916406, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0012393069999916406 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1879.2155729910246, |
|
"count": 95474, |
|
"is_parallel": true, |
|
"self": 46.984084795974695, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 33.91037586009372, |
|
"count": 95474, |
|
"is_parallel": true, |
|
"self": 33.91037586009372 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1661.6547364499272, |
|
"count": 95474, |
|
"is_parallel": true, |
|
"self": 1661.6547364499272 |
|
}, |
|
"steps_from_proto": { |
|
"total": 136.6663758850288, |
|
"count": 95474, |
|
"is_parallel": true, |
|
"self": 28.916061298933585, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 107.75031458609521, |
|
"count": 763792, |
|
"is_parallel": true, |
|
"self": 107.75031458609521 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 933.8731387270326, |
|
"count": 95475, |
|
"self": 3.929698067035474, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 177.41394104199668, |
|
"count": 95475, |
|
"self": 177.12017251699655, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.2937685250001323, |
|
"count": 3, |
|
"self": 0.2937685250001323 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 752.5294996180004, |
|
"count": 353, |
|
"self": 648.6307422760165, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 103.89875734198398, |
|
"count": 7150, |
|
"self": 103.89875734198398 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 8.530000741302501e-07, |
|
"count": 1, |
|
"self": 8.530000741302501e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.11292836199982048, |
|
"count": 1, |
|
"self": 0.0014282719998846005, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.11150008999993588, |
|
"count": 1, |
|
"self": 0.11150008999993588 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |