|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.27549049258232117, |
|
"min": 0.26731228828430176, |
|
"max": 1.4493860006332397, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 8317.609375, |
|
"min": 7942.3828125, |
|
"max": 43968.57421875, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989963.0, |
|
"min": 29995.0, |
|
"max": 989963.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989963.0, |
|
"min": 29995.0, |
|
"max": 989963.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.3820275366306305, |
|
"min": -0.20250090956687927, |
|
"max": 0.4386945366859436, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 101.61932373046875, |
|
"min": -48.19521713256836, |
|
"max": 118.44752502441406, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.05105531960725784, |
|
"min": -0.0468810498714447, |
|
"max": 0.1877581626176834, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 13.58071517944336, |
|
"min": -12.048429489135742, |
|
"max": 44.68644332885742, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.07022312540832107, |
|
"min": 0.06500805549841884, |
|
"max": 0.07482881779885955, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.983123755716495, |
|
"min": 0.5584108903175807, |
|
"max": 1.1224322669828932, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.013360547542758549, |
|
"min": 0.0003223785652858879, |
|
"max": 0.013360547542758549, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.18704766559861968, |
|
"min": 0.0038685427834306545, |
|
"max": 0.18704766559861968, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.2578475807500015e-06, |
|
"min": 7.2578475807500015e-06, |
|
"max": 0.0002952216390927875, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010160986613050003, |
|
"min": 0.00010160986613050003, |
|
"max": 0.0032229553256815997, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10241924999999999, |
|
"min": 0.10241924999999999, |
|
"max": 0.19840721249999999, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4338695, |
|
"min": 1.4338695, |
|
"max": 2.4426861, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.000251683075, |
|
"min": 0.000251683075, |
|
"max": 0.009840880528750002, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.00352356305, |
|
"min": 0.00352356305, |
|
"max": 0.10744440815999999, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.008525403216481209, |
|
"min": 0.00841066800057888, |
|
"max": 0.27556312084198, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.11935564875602722, |
|
"min": 0.11774935573339462, |
|
"max": 2.20450496673584, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 477.74242424242425, |
|
"min": 410.72463768115944, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 31531.0, |
|
"min": 15899.0, |
|
"max": 32971.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.2411784319923473, |
|
"min": -0.9999419873760592, |
|
"max": 1.4189882068073048, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 80.67659807950258, |
|
"min": -31.99760165810585, |
|
"max": 96.65619876235723, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.2411784319923473, |
|
"min": -0.9999419873760592, |
|
"max": 1.4189882068073048, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 80.67659807950258, |
|
"min": -31.99760165810585, |
|
"max": 96.65619876235723, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.043198116634084724, |
|
"min": 0.03816441814056556, |
|
"max": 5.634947238955647, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.8078775812155072, |
|
"min": 2.4962405982078053, |
|
"max": 90.15915582329035, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1674832998", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1674834891" |
|
}, |
|
"total": 1893.6942188510002, |
|
"count": 1, |
|
"self": 0.3832569720002539, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0976965290001317, |
|
"count": 1, |
|
"self": 0.0976965290001317 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 1893.2132653499998, |
|
"count": 1, |
|
"self": 1.137411571040957, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 5.762282159999813, |
|
"count": 1, |
|
"self": 5.762282159999813 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 1886.2316672889592, |
|
"count": 63616, |
|
"self": 1.1827673718380538, |
|
"children": { |
|
"env_step": { |
|
"total": 1261.6161743459515, |
|
"count": 63616, |
|
"self": 1161.435774440035, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 99.44296559802024, |
|
"count": 63616, |
|
"self": 4.168602229000953, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 95.27436336901928, |
|
"count": 62589, |
|
"self": 32.35999166103511, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 62.914371707984174, |
|
"count": 62589, |
|
"self": 62.914371707984174 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.7374343078963648, |
|
"count": 63616, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1890.0498098860203, |
|
"count": 63616, |
|
"is_parallel": true, |
|
"self": 821.1282908740286, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0017148389997601043, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006409549996533315, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0010738840001067729, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0010738840001067729 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04614013199989131, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005768969999735418, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00039142200012065587, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00039142200012065587 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04350961699992695, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04350961699992695 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.001662195999870164, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00045956600069985143, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0012026299991703127, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0012026299991703127 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1068.9215190119917, |
|
"count": 63615, |
|
"is_parallel": true, |
|
"self": 26.496172006321558, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 22.42524333183428, |
|
"count": 63615, |
|
"is_parallel": true, |
|
"self": 22.42524333183428 |
|
}, |
|
"communicator.exchange": { |
|
"total": 929.8074193029115, |
|
"count": 63615, |
|
"is_parallel": true, |
|
"self": 929.8074193029115 |
|
}, |
|
"steps_from_proto": { |
|
"total": 90.19268437092433, |
|
"count": 63615, |
|
"is_parallel": true, |
|
"self": 21.02469858789027, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 69.16798578303406, |
|
"count": 508920, |
|
"is_parallel": true, |
|
"self": 69.16798578303406 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 623.4327255711696, |
|
"count": 63616, |
|
"self": 2.1293135190171597, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 142.43744580915336, |
|
"count": 63616, |
|
"self": 142.24659025815345, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.19085555099991325, |
|
"count": 2, |
|
"self": 0.19085555099991325 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 478.8659662429991, |
|
"count": 448, |
|
"self": 177.89730654393043, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 300.96865969906867, |
|
"count": 22770, |
|
"self": 300.96865969906867 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 8.830002116155811e-07, |
|
"count": 1, |
|
"self": 8.830002116155811e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.08190344699960406, |
|
"count": 1, |
|
"self": 0.0014646529998572078, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.08043879399974685, |
|
"count": 1, |
|
"self": 0.08043879399974685 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |