|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.38535264134407043, |
|
"min": 0.38535264134407043, |
|
"max": 1.4340118169784546, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 11622.2353515625, |
|
"min": 11515.4736328125, |
|
"max": 43502.18359375, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989971.0, |
|
"min": 29901.0, |
|
"max": 989971.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989971.0, |
|
"min": 29901.0, |
|
"max": 989971.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.643875777721405, |
|
"min": -0.10255663841962814, |
|
"max": 0.643875777721405, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 184.79234313964844, |
|
"min": -24.818706512451172, |
|
"max": 184.79234313964844, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.010809449478983879, |
|
"min": -0.005641380324959755, |
|
"max": 0.6432042717933655, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 3.1023120880126953, |
|
"min": -1.5457382202148438, |
|
"max": 152.4394073486328, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06856560069302628, |
|
"min": 0.06486136321870596, |
|
"max": 0.07316504085871962, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.959918409702368, |
|
"min": 0.4832980583188386, |
|
"max": 1.0612731124685308, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.015947685946316813, |
|
"min": 0.0005039816814433899, |
|
"max": 0.026813511493280946, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.22326760324843536, |
|
"min": 0.006551761858764068, |
|
"max": 0.24162014279863797, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.564854621271427e-06, |
|
"min": 7.564854621271427e-06, |
|
"max": 0.0002952351015883, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010590796469779998, |
|
"min": 0.00010590796469779998, |
|
"max": 0.0033802268732578008, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10252158571428571, |
|
"min": 0.10252158571428571, |
|
"max": 0.1984117, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4353022, |
|
"min": 1.3888819, |
|
"max": 2.5267422, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00026190641285714285, |
|
"min": 0.00026190641285714285, |
|
"max": 0.00984132883, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.00366668978, |
|
"min": 0.00366668978, |
|
"max": 0.11270154578000001, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.01548650860786438, |
|
"min": 0.01548650860786438, |
|
"max": 0.8159781694412231, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.21681112051010132, |
|
"min": 0.21681112051010132, |
|
"max": 5.711847305297852, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 287.3047619047619, |
|
"min": 287.3047619047619, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 30167.0, |
|
"min": 16700.0, |
|
"max": 32432.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.6745885523302215, |
|
"min": -0.999987552408129, |
|
"max": 1.6745885523302215, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 175.83179799467325, |
|
"min": -31.999601677060127, |
|
"max": 175.83179799467325, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.6745885523302215, |
|
"min": -0.999987552408129, |
|
"max": 1.6745885523302215, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 175.83179799467325, |
|
"min": -31.999601677060127, |
|
"max": 175.83179799467325, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.04611302747840195, |
|
"min": 0.04611302747840195, |
|
"max": 17.58480724341729, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 4.841867885232205, |
|
"min": 4.660183200932806, |
|
"max": 298.94172313809395, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1673497079", |
|
"python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1673499111" |
|
}, |
|
"total": 2032.4949281039999, |
|
"count": 1, |
|
"self": 0.384770509999953, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.10326109800007544, |
|
"count": 1, |
|
"self": 0.10326109800007544 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2032.0068964959999, |
|
"count": 1, |
|
"self": 1.2466524079970895, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.2558559799999784, |
|
"count": 1, |
|
"self": 6.2558559799999784 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2024.4139960590023, |
|
"count": 63947, |
|
"self": 1.2847530909477882, |
|
"children": { |
|
"env_step": { |
|
"total": 1366.9868217920723, |
|
"count": 63947, |
|
"self": 1264.833158251176, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 101.37037233291721, |
|
"count": 63947, |
|
"self": 4.2471907519106935, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 97.12318158100652, |
|
"count": 62560, |
|
"self": 32.473596955978564, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 64.64958462502796, |
|
"count": 62560, |
|
"self": 64.64958462502796 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.7832912079791186, |
|
"count": 63947, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2027.7310040110192, |
|
"count": 63947, |
|
"is_parallel": true, |
|
"self": 860.8068762800001, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.00181788199984112, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006273579999742651, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011905239998668549, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011905239998668549 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04761529399979736, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004845369999202376, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00044205399990460137, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00044205399990460137 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04513455899996188, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04513455899996188 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0015541440000106377, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00041471899930911604, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011394250007015216, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011394250007015216 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1166.924127731019, |
|
"count": 63946, |
|
"is_parallel": true, |
|
"self": 27.618510007978557, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 22.577149495026788, |
|
"count": 63946, |
|
"is_parallel": true, |
|
"self": 22.577149495026788 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1017.1851497929922, |
|
"count": 63946, |
|
"is_parallel": true, |
|
"self": 1017.1851497929922 |
|
}, |
|
"steps_from_proto": { |
|
"total": 99.54331843502155, |
|
"count": 63946, |
|
"is_parallel": true, |
|
"self": 21.79434892397103, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 77.74896951105052, |
|
"count": 511568, |
|
"is_parallel": true, |
|
"self": 77.74896951105052 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 656.1424211759822, |
|
"count": 63947, |
|
"self": 2.426197324955865, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 142.53838653202888, |
|
"count": 63947, |
|
"self": 142.33866893302934, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.19971759899954122, |
|
"count": 2, |
|
"self": 0.19971759899954122 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 511.1778373189975, |
|
"count": 452, |
|
"self": 199.35278211000355, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 311.82505520899394, |
|
"count": 22779, |
|
"self": 311.82505520899394 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.300001693191007e-07, |
|
"count": 1, |
|
"self": 9.300001693191007e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.09039111900028729, |
|
"count": 1, |
|
"self": 0.0014103810003689432, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.08898073799991835, |
|
"count": 1, |
|
"self": 0.08898073799991835 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |