jackhhhh's picture
Push
204cb5f
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.2992294430732727,
"min": 0.2992294430732727,
"max": 1.492452621459961,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 9048.6982421875,
"min": 9048.6982421875,
"max": 45275.04296875,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989926.0,
"min": 29957.0,
"max": 989926.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989926.0,
"min": 29957.0,
"max": 989926.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.587913990020752,
"min": -0.09508303552865982,
"max": 0.6669148206710815,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 162.26426696777344,
"min": -22.91501235961914,
"max": 194.07220458984375,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.011886782944202423,
"min": -0.031833529472351074,
"max": 0.20138977468013763,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 3.280752182006836,
"min": -7.576379776000977,
"max": 48.736324310302734,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.0704758680319459,
"min": 0.06429999697040727,
"max": 0.07241002595678549,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9866621524472425,
"min": 0.5020450306949259,
"max": 1.0506646613745638,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.014914674551175816,
"min": 0.0001606622993645703,
"max": 0.015761754097286067,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.20880544371646143,
"min": 0.0022492721911039843,
"max": 0.2339067940566547,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.690511722242855e-06,
"min": 7.690511722242855e-06,
"max": 0.00029523818730155715,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00010766716411139996,
"min": 0.00010766716411139996,
"max": 0.0036084981971673,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10256347142857143,
"min": 0.10256347142857143,
"max": 0.19841272857142855,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4358886,
"min": 1.3888890999999999,
"max": 2.5695068,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00026609079571428566,
"min": 0.00026609079571428566,
"max": 0.009841431584285715,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0037252711399999995,
"min": 0.0037252711399999995,
"max": 0.12029298673,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.01237169187515974,
"min": 0.01237169187515974,
"max": 0.3624524772167206,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.17320369184017181,
"min": 0.17320369184017181,
"max": 2.5371673107147217,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 328.22727272727275,
"min": 284.6990291262136,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 28884.0,
"min": 16628.0,
"max": 32781.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.649034072306346,
"min": -0.9998375521972775,
"max": 1.7141851693115853,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 145.11499836295843,
"min": -31.99480167031288,
"max": 185.1319982856512,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.649034072306346,
"min": -0.9998375521972775,
"max": 1.7141851693115853,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 145.11499836295843,
"min": -31.99480167031288,
"max": 185.1319982856512,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.04222177033476659,
"min": 0.03835009137839328,
"max": 7.25148319453001,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 3.7155157894594595,
"min": 3.7155157894594595,
"max": 123.27521430701017,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1679200891",
"python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1679203020"
},
"total": 2129.645745955,
"count": 1,
"self": 0.4741174550008509,
"children": {
"run_training.setup": {
"total": 0.10579601399967942,
"count": 1,
"self": 0.10579601399967942
},
"TrainerController.start_learning": {
"total": 2129.0658324859996,
"count": 1,
"self": 1.506976754923926,
"children": {
"TrainerController._reset_env": {
"total": 6.197753757999635,
"count": 1,
"self": 6.197753757999635
},
"TrainerController.advance": {
"total": 2121.268153165076,
"count": 64017,
"self": 1.602584594106247,
"children": {
"env_step": {
"total": 1503.9630158600344,
"count": 64017,
"self": 1389.157125215048,
"children": {
"SubprocessEnvManager._take_step": {
"total": 113.89014844903159,
"count": 64017,
"self": 4.751692930037734,
"children": {
"TorchPolicy.evaluate": {
"total": 109.13845551899385,
"count": 62558,
"self": 109.13845551899385
}
}
},
"workers": {
"total": 0.9157421959548628,
"count": 64017,
"self": 0.0,
"children": {
"worker_root": {
"total": 2124.198507129002,
"count": 64017,
"is_parallel": true,
"self": 853.9254579731282,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0019010460000572493,
"count": 1,
"is_parallel": true,
"self": 0.0006330769997475727,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012679690003096766,
"count": 8,
"is_parallel": true,
"self": 0.0012679690003096766
}
}
},
"UnityEnvironment.step": {
"total": 0.08576096200022221,
"count": 1,
"is_parallel": true,
"self": 0.0005926660001023265,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00040959699981613085,
"count": 1,
"is_parallel": true,
"self": 0.00040959699981613085
},
"communicator.exchange": {
"total": 0.08316502000025139,
"count": 1,
"is_parallel": true,
"self": 0.08316502000025139
},
"steps_from_proto": {
"total": 0.0015936790000523615,
"count": 1,
"is_parallel": true,
"self": 0.00036088500019104686,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012327939998613147,
"count": 8,
"is_parallel": true,
"self": 0.0012327939998613147
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1270.2730491558737,
"count": 64016,
"is_parallel": true,
"self": 31.001365252864616,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 22.399567527079853,
"count": 64016,
"is_parallel": true,
"self": 22.399567527079853
},
"communicator.exchange": {
"total": 1125.852470723948,
"count": 64016,
"is_parallel": true,
"self": 1125.852470723948
},
"steps_from_proto": {
"total": 91.01964565198114,
"count": 64016,
"is_parallel": true,
"self": 19.654464270681274,
"children": {
"_process_rank_one_or_two_observation": {
"total": 71.36518138129986,
"count": 512128,
"is_parallel": true,
"self": 71.36518138129986
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 615.7025527109354,
"count": 64017,
"self": 2.8630582349819633,
"children": {
"process_trajectory": {
"total": 117.09458153496371,
"count": 64017,
"self": 116.89556704396409,
"children": {
"RLTrainer._checkpoint": {
"total": 0.1990144909996161,
"count": 2,
"self": 0.1990144909996161
}
}
},
"_update_policy": {
"total": 495.7449129409897,
"count": 458,
"self": 312.1669926319523,
"children": {
"TorchPPOOptimizer.update": {
"total": 183.57792030903738,
"count": 22791,
"self": 183.57792030903738
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.420000424142927e-07,
"count": 1,
"self": 9.420000424142927e-07
},
"TrainerController._save_models": {
"total": 0.09294786600003135,
"count": 1,
"self": 0.0014057910002520657,
"children": {
"RLTrainer._checkpoint": {
"total": 0.09154207499977929,
"count": 1,
"self": 0.09154207499977929
}
}
}
}
}
}
}