spatial's picture
Pyramids
9bfb45b
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.4560242295265198,
"min": 0.428190678358078,
"max": 1.506645917892456,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 13782.8759765625,
"min": 12647.0400390625,
"max": 45705.609375,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989882.0,
"min": 29952.0,
"max": 989882.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989882.0,
"min": 29952.0,
"max": 989882.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.06469903141260147,
"min": -0.11465805768966675,
"max": 0.09703339636325836,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 16.11005973815918,
"min": -27.632591247558594,
"max": 24.064281463623047,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.009364745579659939,
"min": 0.0039476146921515465,
"max": 0.09955163300037384,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 2.3318216800689697,
"min": 0.9592703580856323,
"max": 23.892391204833984,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06846382050398028,
"min": 0.06525789853455287,
"max": 0.07563013646861022,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9584934870557239,
"min": 0.4899245364361994,
"max": 1.046818327301926,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.00719148833975071,
"min": 4.861112191611242e-05,
"max": 0.008414805138145262,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.10068083675650995,
"min": 0.0006319445849094614,
"max": 0.11780727193403366,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.607926035485714e-06,
"min": 7.607926035485714e-06,
"max": 0.00029515063018788575,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.0001065109644968,
"min": 0.0001065109644968,
"max": 0.0032258860247046995,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10253594285714286,
"min": 0.10253594285714286,
"max": 0.19838354285714285,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4355032,
"min": 1.3886848,
"max": 2.3467824,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0002633406914285715,
"min": 0.0002633406914285715,
"max": 0.00983851593142857,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003686769680000001,
"min": 0.003686769680000001,
"max": 0.10754200047000001,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.011606285348534584,
"min": 0.011606285348534584,
"max": 0.25451597571372986,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.16248799860477448,
"min": 0.16248799860477448,
"max": 1.7816119194030762,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 832.4358974358975,
"min": 708.95,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 32465.0,
"min": 15984.0,
"max": 32465.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 0.1416820106215966,
"min": -1.0000000521540642,
"max": 0.39079496581107376,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 5.525598414242268,
"min": -30.998201623558998,
"max": 15.631798632442951,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 0.1416820106215966,
"min": -1.0000000521540642,
"max": 0.39079496581107376,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 5.525598414242268,
"min": -30.998201623558998,
"max": 15.631798632442951,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.10104023319600412,
"min": 0.09197263081587152,
"max": 4.949434297159314,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 3.940569094644161,
"min": 3.6150847100652754,
"max": 79.19094875454903,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1676123783",
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.6",
"end_time_seconds": "1676125917"
},
"total": 2134.5542478700004,
"count": 1,
"self": 0.4748590039998817,
"children": {
"run_training.setup": {
"total": 0.12283512400017571,
"count": 1,
"self": 0.12283512400017571
},
"TrainerController.start_learning": {
"total": 2133.9565537420003,
"count": 1,
"self": 1.2193468790214865,
"children": {
"TrainerController._reset_env": {
"total": 6.190092013999674,
"count": 1,
"self": 6.190092013999674
},
"TrainerController.advance": {
"total": 2126.45938309598,
"count": 63093,
"self": 1.3071009229843185,
"children": {
"env_step": {
"total": 1406.5567779079456,
"count": 63093,
"self": 1299.393295936864,
"children": {
"SubprocessEnvManager._take_step": {
"total": 106.42281186701302,
"count": 63093,
"self": 4.400783107010284,
"children": {
"TorchPolicy.evaluate": {
"total": 102.02202876000274,
"count": 62573,
"self": 35.028317536955,
"children": {
"TorchPolicy.sample_actions": {
"total": 66.99371122304774,
"count": 62573,
"self": 66.99371122304774
}
}
}
}
},
"workers": {
"total": 0.740670104068613,
"count": 63093,
"self": 0.0,
"children": {
"worker_root": {
"total": 2129.3964883450444,
"count": 63093,
"is_parallel": true,
"self": 936.8135326430443,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0018469239998921694,
"count": 1,
"is_parallel": true,
"self": 0.000733351000235416,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011135729996567534,
"count": 8,
"is_parallel": true,
"self": 0.0011135729996567534
}
}
},
"UnityEnvironment.step": {
"total": 0.048866593999719043,
"count": 1,
"is_parallel": true,
"self": 0.0005057670000496728,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00045822999982192414,
"count": 1,
"is_parallel": true,
"self": 0.00045822999982192414
},
"communicator.exchange": {
"total": 0.04631425499974284,
"count": 1,
"is_parallel": true,
"self": 0.04631425499974284
},
"steps_from_proto": {
"total": 0.0015883420001046034,
"count": 1,
"is_parallel": true,
"self": 0.0004039530003865366,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011843889997180668,
"count": 8,
"is_parallel": true,
"self": 0.0011843889997180668
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1192.5829557020002,
"count": 63092,
"is_parallel": true,
"self": 30.818812181998965,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 22.479508520041236,
"count": 63092,
"is_parallel": true,
"self": 22.479508520041236
},
"communicator.exchange": {
"total": 1038.942287997074,
"count": 63092,
"is_parallel": true,
"self": 1038.942287997074
},
"steps_from_proto": {
"total": 100.34234700288607,
"count": 63092,
"is_parallel": true,
"self": 21.711927341807495,
"children": {
"_process_rank_one_or_two_observation": {
"total": 78.63041966107858,
"count": 504736,
"is_parallel": true,
"self": 78.63041966107858
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 718.5955042650498,
"count": 63093,
"self": 2.198287098133278,
"children": {
"process_trajectory": {
"total": 155.85582828990937,
"count": 63093,
"self": 155.6649238869095,
"children": {
"RLTrainer._checkpoint": {
"total": 0.19090440299987677,
"count": 2,
"self": 0.19090440299987677
}
}
},
"_update_policy": {
"total": 560.5413888770072,
"count": 434,
"self": 216.26933375304588,
"children": {
"TorchPPOOptimizer.update": {
"total": 344.2720551239613,
"count": 22818,
"self": 344.2720551239613
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.069999578059651e-07,
"count": 1,
"self": 9.069999578059651e-07
},
"TrainerController._save_models": {
"total": 0.08773084599943104,
"count": 1,
"self": 0.001455425000131072,
"children": {
"RLTrainer._checkpoint": {
"total": 0.08627542099929997,
"count": 1,
"self": 0.08627542099929997
}
}
}
}
}
}
}