ppo-Pyramids / run_logs /timers.json
kaljr's picture
First Push
849c0e6 verified
raw
history blame
18.7 kB
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.25450700521469116,
"min": 0.2513265013694763,
"max": 1.425731897354126,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 7716.65283203125,
"min": 7531.7529296875,
"max": 43251.00390625,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989956.0,
"min": 29902.0,
"max": 989956.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989956.0,
"min": 29902.0,
"max": 989956.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.5468913912773132,
"min": -0.10540304332971573,
"max": 0.6365823149681091,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 151.48892211914062,
"min": -25.296730041503906,
"max": 180.7893829345703,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.027380799874663353,
"min": 0.007756194565445185,
"max": 0.40319085121154785,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 7.584481716156006,
"min": 2.1019287109375,
"max": 95.55622863769531,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06598515946857837,
"min": 0.06474892868610162,
"max": 0.07235195697878317,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9897773920286757,
"min": 0.5616991292927818,
"max": 1.0584658651422096,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.017123018421019275,
"min": 0.00023954040768810967,
"max": 0.017123018421019275,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.25684527631528914,
"min": 0.0033535657076335353,
"max": 0.25684527631528914,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.443477518873336e-06,
"min": 7.443477518873336e-06,
"max": 0.000295215076594975,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00011165216278310004,
"min": 0.00011165216278310004,
"max": 0.0036090342969886,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10248112666666669,
"min": 0.10248112666666669,
"max": 0.19840502499999998,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.5372169000000002,
"min": 1.4776296000000002,
"max": 2.5725222000000003,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00025786455400000013,
"min": 0.00025786455400000013,
"max": 0.0098406619975,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003867968310000002,
"min": 0.003867968310000002,
"max": 0.12031083886000002,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.014584985561668873,
"min": 0.014120169915258884,
"max": 0.5579977035522461,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.21877478063106537,
"min": 0.19768238067626953,
"max": 4.463981628417969,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 328.7956989247312,
"min": 285.9,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30578.0,
"min": 15934.0,
"max": 33048.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.5599412869500078,
"min": -0.9998000515624881,
"max": 1.6929050364879648,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 143.5145983994007,
"min": -31.99360164999962,
"max": 167.5975986123085,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.5599412869500078,
"min": -0.9998000515624881,
"max": 1.6929050364879648,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 143.5145983994007,
"min": -31.99360164999962,
"max": 167.5975986123085,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.0500471337480754,
"min": 0.04836135261516896,
"max": 12.475103815086186,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 4.604336304822937,
"min": 4.1674862858781125,
"max": 199.60166104137897,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1708911350",
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.2.1+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1708914527"
},
"total": 3177.1321454090003,
"count": 1,
"self": 0.6001731570004267,
"children": {
"run_training.setup": {
"total": 0.06533630900003118,
"count": 1,
"self": 0.06533630900003118
},
"TrainerController.start_learning": {
"total": 3176.466635943,
"count": 1,
"self": 2.178739297989523,
"children": {
"TrainerController._reset_env": {
"total": 4.414482060999944,
"count": 1,
"self": 4.414482060999944
},
"TrainerController.advance": {
"total": 3169.7864719760105,
"count": 64068,
"self": 2.5467041879733188,
"children": {
"env_step": {
"total": 2130.257791092021,
"count": 64068,
"self": 1969.038138135983,
"children": {
"SubprocessEnvManager._take_step": {
"total": 159.8559913420636,
"count": 64068,
"self": 6.671488224062955,
"children": {
"TorchPolicy.evaluate": {
"total": 153.18450311800063,
"count": 62550,
"self": 153.18450311800063
}
}
},
"workers": {
"total": 1.3636616139742728,
"count": 64068,
"self": 0.0,
"children": {
"worker_root": {
"total": 3170.7778017090354,
"count": 64068,
"is_parallel": true,
"self": 1367.4470129960123,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.007462790999966273,
"count": 1,
"is_parallel": true,
"self": 0.005348088999880929,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0021147020000853445,
"count": 8,
"is_parallel": true,
"self": 0.0021147020000853445
}
}
},
"UnityEnvironment.step": {
"total": 0.06342643000004955,
"count": 1,
"is_parallel": true,
"self": 0.0007525450000684941,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005173430000695589,
"count": 1,
"is_parallel": true,
"self": 0.0005173430000695589
},
"communicator.exchange": {
"total": 0.0600727989999541,
"count": 1,
"is_parallel": true,
"self": 0.0600727989999541
},
"steps_from_proto": {
"total": 0.002083742999957394,
"count": 1,
"is_parallel": true,
"self": 0.000438400999996702,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0016453419999606922,
"count": 8,
"is_parallel": true,
"self": 0.0016453419999606922
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1803.3307887130231,
"count": 64067,
"is_parallel": true,
"self": 47.36134188999449,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 27.392768350986103,
"count": 64067,
"is_parallel": true,
"self": 27.392768350986103
},
"communicator.exchange": {
"total": 1600.4127628180036,
"count": 64067,
"is_parallel": true,
"self": 1600.4127628180036
},
"steps_from_proto": {
"total": 128.1639156540391,
"count": 64067,
"is_parallel": true,
"self": 26.994489046058447,
"children": {
"_process_rank_one_or_two_observation": {
"total": 101.16942660798065,
"count": 512536,
"is_parallel": true,
"self": 101.16942660798065
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1036.9819766960163,
"count": 64068,
"self": 4.510689651992379,
"children": {
"process_trajectory": {
"total": 158.17156564502625,
"count": 64068,
"self": 157.95296877902615,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2185968660000981,
"count": 2,
"self": 0.2185968660000981
}
}
},
"_update_policy": {
"total": 874.2997213989977,
"count": 456,
"self": 350.3324504190109,
"children": {
"TorchPPOOptimizer.update": {
"total": 523.9672709799868,
"count": 22764,
"self": 523.9672709799868
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.1319998520775698e-06,
"count": 1,
"self": 1.1319998520775698e-06
},
"TrainerController._save_models": {
"total": 0.08694147599999269,
"count": 1,
"self": 0.0019458599999779835,
"children": {
"RLTrainer._checkpoint": {
"total": 0.0849956160000147,
"count": 1,
"self": 0.0849956160000147
}
}
}
}
}
}
}