ArneL2206's picture
init
b4d1748
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.32455044984817505,
"min": 0.32455044984817505,
"max": 1.4014934301376343,
"count": 38
},
"Pyramids.Policy.Entropy.sum": {
"value": 9658.62109375,
"min": 9658.62109375,
"max": 42515.703125,
"count": 38
},
"Pyramids.Step.mean": {
"value": 1139913.0,
"min": 29952.0,
"max": 1139913.0,
"count": 38
},
"Pyramids.Step.sum": {
"value": 1139913.0,
"min": 29952.0,
"max": 1139913.0,
"count": 38
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.7032342553138733,
"min": -0.08691871911287308,
"max": 0.7546818256378174,
"count": 38
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 198.3120574951172,
"min": -20.947410583496094,
"max": 221.87646484375,
"count": 38
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": -0.0030358193907886744,
"min": -0.0030358193907886744,
"max": 0.7074459195137024,
"count": 38
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": -0.8561010956764221,
"min": -0.8561010956764221,
"max": 167.66468811035156,
"count": 38
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.0678462937241257,
"min": 0.0659452210711912,
"max": 0.073509724354841,
"count": 38
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9498481121377599,
"min": 0.5125883137292079,
"max": 1.0995384643188741,
"count": 38
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.014161616487898775,
"min": 0.0009429177532035344,
"max": 0.022875304939388996,
"count": 38
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.19826263083058285,
"min": 0.011315013038442413,
"max": 0.25841210885760924,
"count": 38
},
"Pyramids.Policy.LearningRate.mean": {
"value": 0.00018744825894583095,
"min": 0.00018744825894583095,
"max": 0.00029838354339596195,
"count": 38
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.0026242756252416333,
"min": 0.0020886848037717336,
"max": 0.004011005562998167,
"count": 38
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.16248274047619052,
"min": 0.16248274047619052,
"max": 0.19946118095238097,
"count": 38
},
"Pyramids.Policy.Epsilon.sum": {
"value": 2.274758366666667,
"min": 1.3962282666666668,
"max": 2.782524833333333,
"count": 38
},
"Pyramids.Policy.Beta.mean": {
"value": 0.006252025773571429,
"min": 0.006252025773571429,
"max": 0.009946171977142856,
"count": 38
},
"Pyramids.Policy.Beta.sum": {
"value": 0.08752836083,
"min": 0.06962320384,
"max": 0.13370648315,
"count": 38
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.011095731519162655,
"min": 0.011095731519162655,
"max": 0.6866158246994019,
"count": 38
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.15534023940563202,
"min": 0.15534023940563202,
"max": 4.806310653686523,
"count": 38
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 282.92727272727274,
"min": 245.7520661157025,
"max": 999.0,
"count": 38
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 31122.0,
"min": 15984.0,
"max": 33343.0,
"count": 38
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.6625486049083396,
"min": -1.0000000521540642,
"max": 1.7377140310185015,
"count": 38
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 181.217797935009,
"min": -29.920001707971096,
"max": 210.26339775323868,
"count": 38
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.6625486049083396,
"min": -1.0000000521540642,
"max": 1.7377140310185015,
"count": 38
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 181.217797935009,
"min": -29.920001707971096,
"max": 210.26339775323868,
"count": 38
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.032435735565858013,
"min": 0.02944811480552774,
"max": 15.783606315031648,
"count": 38
},
"Pyramids.Policy.RndReward.sum": {
"value": 3.5354951766785234,
"min": 3.5354951766785234,
"max": 252.53770104050636,
"count": 38
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 38
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 38
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1674331976",
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.6",
"end_time_seconds": "1674334362"
},
"total": 2386.036490971,
"count": 1,
"self": 0.33600176700065276,
"children": {
"run_training.setup": {
"total": 0.10314740299963887,
"count": 1,
"self": 0.10314740299963887
},
"TrainerController.start_learning": {
"total": 2385.597341801,
"count": 1,
"self": 1.277292170997498,
"children": {
"TrainerController._reset_env": {
"total": 5.984121487000266,
"count": 1,
"self": 5.984121487000266
},
"TrainerController.advance": {
"total": 2378.1859671930024,
"count": 74138,
"self": 1.30607813296092,
"children": {
"env_step": {
"total": 1644.9988005469818,
"count": 74138,
"self": 1534.900517766784,
"children": {
"SubprocessEnvManager._take_step": {
"total": 109.30514457307163,
"count": 74138,
"self": 4.62598370005162,
"children": {
"TorchPolicy.evaluate": {
"total": 104.67916087302001,
"count": 72249,
"self": 35.43943694206746,
"children": {
"TorchPolicy.sample_actions": {
"total": 69.23972393095255,
"count": 72249,
"self": 69.23972393095255
}
}
}
}
},
"workers": {
"total": 0.7931382071260487,
"count": 74137,
"self": 0.0,
"children": {
"worker_root": {
"total": 2381.2596111110156,
"count": 74137,
"is_parallel": true,
"self": 951.2278270509796,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0016657150003993593,
"count": 1,
"is_parallel": true,
"self": 0.0005783720012004778,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0010873429991988814,
"count": 8,
"is_parallel": true,
"self": 0.0010873429991988814
}
}
},
"UnityEnvironment.step": {
"total": 0.042329461999997875,
"count": 1,
"is_parallel": true,
"self": 0.0004626690001714451,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00042751699993459624,
"count": 1,
"is_parallel": true,
"self": 0.00042751699993459624
},
"communicator.exchange": {
"total": 0.0399360749997868,
"count": 1,
"is_parallel": true,
"self": 0.0399360749997868
},
"steps_from_proto": {
"total": 0.0015032010001050367,
"count": 1,
"is_parallel": true,
"self": 0.0003869020006277424,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011162989994772943,
"count": 8,
"is_parallel": true,
"self": 0.0011162989994772943
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1430.031784060036,
"count": 74136,
"is_parallel": true,
"self": 30.897817024909273,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 24.33003257004748,
"count": 74136,
"is_parallel": true,
"self": 24.33003257004748
},
"communicator.exchange": {
"total": 1265.2588427510855,
"count": 74136,
"is_parallel": true,
"self": 1265.2588427510855
},
"steps_from_proto": {
"total": 109.54509171399377,
"count": 74136,
"is_parallel": true,
"self": 23.531156822258254,
"children": {
"_process_rank_one_or_two_observation": {
"total": 86.01393489173552,
"count": 593088,
"is_parallel": true,
"self": 86.01393489173552
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 731.8810885130597,
"count": 74137,
"self": 2.467187754024053,
"children": {
"process_trajectory": {
"total": 160.07127956703243,
"count": 74137,
"self": 159.89747450903224,
"children": {
"RLTrainer._checkpoint": {
"total": 0.1738050580001982,
"count": 2,
"self": 0.1738050580001982
}
}
},
"_update_policy": {
"total": 569.3426211920032,
"count": 526,
"self": 219.76144839701283,
"children": {
"TorchPPOOptimizer.update": {
"total": 349.5811727949904,
"count": 26319,
"self": 349.5811727949904
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.3239996405900456e-06,
"count": 1,
"self": 1.3239996405900456e-06
},
"TrainerController._save_models": {
"total": 0.1499596260000544,
"count": 1,
"self": 0.0037016400001448346,
"children": {
"RLTrainer._checkpoint": {
"total": 0.14625798599990958,
"count": 1,
"self": 0.14625798599990958
}
}
}
}
}
}
}