|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.32455044984817505, |
|
"min": 0.32455044984817505, |
|
"max": 1.4014934301376343, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 9658.62109375, |
|
"min": 9658.62109375, |
|
"max": 42515.703125, |
|
"count": 38 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 1139913.0, |
|
"min": 29952.0, |
|
"max": 1139913.0, |
|
"count": 38 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 1139913.0, |
|
"min": 29952.0, |
|
"max": 1139913.0, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.7032342553138733, |
|
"min": -0.08691871911287308, |
|
"max": 0.7546818256378174, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 198.3120574951172, |
|
"min": -20.947410583496094, |
|
"max": 221.87646484375, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": -0.0030358193907886744, |
|
"min": -0.0030358193907886744, |
|
"max": 0.7074459195137024, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": -0.8561010956764221, |
|
"min": -0.8561010956764221, |
|
"max": 167.66468811035156, |
|
"count": 38 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.0678462937241257, |
|
"min": 0.0659452210711912, |
|
"max": 0.073509724354841, |
|
"count": 38 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9498481121377599, |
|
"min": 0.5125883137292079, |
|
"max": 1.0995384643188741, |
|
"count": 38 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.014161616487898775, |
|
"min": 0.0009429177532035344, |
|
"max": 0.022875304939388996, |
|
"count": 38 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.19826263083058285, |
|
"min": 0.011315013038442413, |
|
"max": 0.25841210885760924, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 0.00018744825894583095, |
|
"min": 0.00018744825894583095, |
|
"max": 0.00029838354339596195, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.0026242756252416333, |
|
"min": 0.0020886848037717336, |
|
"max": 0.004011005562998167, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.16248274047619052, |
|
"min": 0.16248274047619052, |
|
"max": 0.19946118095238097, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 2.274758366666667, |
|
"min": 1.3962282666666668, |
|
"max": 2.782524833333333, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.006252025773571429, |
|
"min": 0.006252025773571429, |
|
"max": 0.009946171977142856, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.08752836083, |
|
"min": 0.06962320384, |
|
"max": 0.13370648315, |
|
"count": 38 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.011095731519162655, |
|
"min": 0.011095731519162655, |
|
"max": 0.6866158246994019, |
|
"count": 38 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.15534023940563202, |
|
"min": 0.15534023940563202, |
|
"max": 4.806310653686523, |
|
"count": 38 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 282.92727272727274, |
|
"min": 245.7520661157025, |
|
"max": 999.0, |
|
"count": 38 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 31122.0, |
|
"min": 15984.0, |
|
"max": 33343.0, |
|
"count": 38 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.6625486049083396, |
|
"min": -1.0000000521540642, |
|
"max": 1.7377140310185015, |
|
"count": 38 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 181.217797935009, |
|
"min": -29.920001707971096, |
|
"max": 210.26339775323868, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.6625486049083396, |
|
"min": -1.0000000521540642, |
|
"max": 1.7377140310185015, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 181.217797935009, |
|
"min": -29.920001707971096, |
|
"max": 210.26339775323868, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.032435735565858013, |
|
"min": 0.02944811480552774, |
|
"max": 15.783606315031648, |
|
"count": 38 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 3.5354951766785234, |
|
"min": 3.5354951766785234, |
|
"max": 252.53770104050636, |
|
"count": 38 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 38 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 38 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1674331976", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1674334362" |
|
}, |
|
"total": 2386.036490971, |
|
"count": 1, |
|
"self": 0.33600176700065276, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.10314740299963887, |
|
"count": 1, |
|
"self": 0.10314740299963887 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2385.597341801, |
|
"count": 1, |
|
"self": 1.277292170997498, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 5.984121487000266, |
|
"count": 1, |
|
"self": 5.984121487000266 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2378.1859671930024, |
|
"count": 74138, |
|
"self": 1.30607813296092, |
|
"children": { |
|
"env_step": { |
|
"total": 1644.9988005469818, |
|
"count": 74138, |
|
"self": 1534.900517766784, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 109.30514457307163, |
|
"count": 74138, |
|
"self": 4.62598370005162, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 104.67916087302001, |
|
"count": 72249, |
|
"self": 35.43943694206746, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 69.23972393095255, |
|
"count": 72249, |
|
"self": 69.23972393095255 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.7931382071260487, |
|
"count": 74137, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2381.2596111110156, |
|
"count": 74137, |
|
"is_parallel": true, |
|
"self": 951.2278270509796, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0016657150003993593, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005783720012004778, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0010873429991988814, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0010873429991988814 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.042329461999997875, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004626690001714451, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00042751699993459624, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00042751699993459624 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.0399360749997868, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0399360749997868 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0015032010001050367, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0003869020006277424, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011162989994772943, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011162989994772943 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1430.031784060036, |
|
"count": 74136, |
|
"is_parallel": true, |
|
"self": 30.897817024909273, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 24.33003257004748, |
|
"count": 74136, |
|
"is_parallel": true, |
|
"self": 24.33003257004748 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1265.2588427510855, |
|
"count": 74136, |
|
"is_parallel": true, |
|
"self": 1265.2588427510855 |
|
}, |
|
"steps_from_proto": { |
|
"total": 109.54509171399377, |
|
"count": 74136, |
|
"is_parallel": true, |
|
"self": 23.531156822258254, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 86.01393489173552, |
|
"count": 593088, |
|
"is_parallel": true, |
|
"self": 86.01393489173552 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 731.8810885130597, |
|
"count": 74137, |
|
"self": 2.467187754024053, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 160.07127956703243, |
|
"count": 74137, |
|
"self": 159.89747450903224, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.1738050580001982, |
|
"count": 2, |
|
"self": 0.1738050580001982 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 569.3426211920032, |
|
"count": 526, |
|
"self": 219.76144839701283, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 349.5811727949904, |
|
"count": 26319, |
|
"self": 349.5811727949904 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.3239996405900456e-06, |
|
"count": 1, |
|
"self": 1.3239996405900456e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.1499596260000544, |
|
"count": 1, |
|
"self": 0.0037016400001448346, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.14625798599990958, |
|
"count": 1, |
|
"self": 0.14625798599990958 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |