ppo-pyramid-default / run_logs /timers.json

init

b4d1748 about 2 years ago

19.2 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.32455044984817505,
	"min": 0.32455044984817505,
	"max": 1.4014934301376343,
	"count": 38
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 9658.62109375,
	"min": 9658.62109375,
	"max": 42515.703125,
	"count": 38
	},
	"Pyramids.Step.mean": {
	"value": 1139913.0,
	"min": 29952.0,
	"max": 1139913.0,
	"count": 38
	},
	"Pyramids.Step.sum": {
	"value": 1139913.0,
	"min": 29952.0,
	"max": 1139913.0,
	"count": 38
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.7032342553138733,
	"min": -0.08691871911287308,
	"max": 0.7546818256378174,
	"count": 38
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 198.3120574951172,
	"min": -20.947410583496094,
	"max": 221.87646484375,
	"count": 38
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.0030358193907886744,
	"min": -0.0030358193907886744,
	"max": 0.7074459195137024,
	"count": 38
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -0.8561010956764221,
	"min": -0.8561010956764221,
	"max": 167.66468811035156,
	"count": 38
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.0678462937241257,
	"min": 0.0659452210711912,
	"max": 0.073509724354841,
	"count": 38
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9498481121377599,
	"min": 0.5125883137292079,
	"max": 1.0995384643188741,
	"count": 38
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.014161616487898775,
	"min": 0.0009429177532035344,
	"max": 0.022875304939388996,
	"count": 38
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.19826263083058285,
	"min": 0.011315013038442413,
	"max": 0.25841210885760924,
	"count": 38
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 0.00018744825894583095,
	"min": 0.00018744825894583095,
	"max": 0.00029838354339596195,
	"count": 38
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.0026242756252416333,
	"min": 0.0020886848037717336,
	"max": 0.004011005562998167,
	"count": 38
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.16248274047619052,
	"min": 0.16248274047619052,
	"max": 0.19946118095238097,
	"count": 38
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 2.274758366666667,
	"min": 1.3962282666666668,
	"max": 2.782524833333333,
	"count": 38
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.006252025773571429,
	"min": 0.006252025773571429,
	"max": 0.009946171977142856,
	"count": 38
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.08752836083,
	"min": 0.06962320384,
	"max": 0.13370648315,
	"count": 38
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.011095731519162655,
	"min": 0.011095731519162655,
	"max": 0.6866158246994019,
	"count": 38
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.15534023940563202,
	"min": 0.15534023940563202,
	"max": 4.806310653686523,
	"count": 38
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 282.92727272727274,
	"min": 245.7520661157025,
	"max": 999.0,
	"count": 38
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 31122.0,
	"min": 15984.0,
	"max": 33343.0,
	"count": 38
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.6625486049083396,
	"min": -1.0000000521540642,
	"max": 1.7377140310185015,
	"count": 38
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 181.217797935009,
	"min": -29.920001707971096,
	"max": 210.26339775323868,
	"count": 38
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.6625486049083396,
	"min": -1.0000000521540642,
	"max": 1.7377140310185015,
	"count": 38
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 181.217797935009,
	"min": -29.920001707971096,
	"max": 210.26339775323868,
	"count": 38
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.032435735565858013,
	"min": 0.02944811480552774,
	"max": 15.783606315031648,
	"count": 38
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 3.5354951766785234,
	"min": 3.5354951766785234,
	"max": 252.53770104050636,
	"count": 38
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 38
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 38
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1674331976",
	"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.29.0.dev0",
	"mlagents_envs_version": "0.29.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.21.6",
	"end_time_seconds": "1674334362"
	},
	"total": 2386.036490971,
	"count": 1,
	"self": 0.33600176700065276,
	"children": {
	"run_training.setup": {
	"total": 0.10314740299963887,
	"count": 1,
	"self": 0.10314740299963887
	},
	"TrainerController.start_learning": {
	"total": 2385.597341801,
	"count": 1,
	"self": 1.277292170997498,
	"children": {
	"TrainerController._reset_env": {
	"total": 5.984121487000266,
	"count": 1,
	"self": 5.984121487000266
	},
	"TrainerController.advance": {
	"total": 2378.1859671930024,
	"count": 74138,
	"self": 1.30607813296092,
	"children": {
	"env_step": {
	"total": 1644.9988005469818,
	"count": 74138,
	"self": 1534.900517766784,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 109.30514457307163,
	"count": 74138,
	"self": 4.62598370005162,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 104.67916087302001,
	"count": 72249,
	"self": 35.43943694206746,
	"children": {
	"TorchPolicy.sample_actions": {
	"total": 69.23972393095255,
	"count": 72249,
	"self": 69.23972393095255
	}
	}
	}
	}
	},
	"workers": {
	"total": 0.7931382071260487,
	"count": 74137,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2381.2596111110156,
	"count": 74137,
	"is_parallel": true,
	"self": 951.2278270509796,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0016657150003993593,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005783720012004778,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0010873429991988814,
	"count": 8,
	"is_parallel": true,
	"self": 0.0010873429991988814
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.042329461999997875,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004626690001714451,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00042751699993459624,
	"count": 1,
	"is_parallel": true,
	"self": 0.00042751699993459624
	},
	"communicator.exchange": {
	"total": 0.0399360749997868,
	"count": 1,
	"is_parallel": true,
	"self": 0.0399360749997868
	},
	"steps_from_proto": {
	"total": 0.0015032010001050367,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003869020006277424,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0011162989994772943,
	"count": 8,
	"is_parallel": true,
	"self": 0.0011162989994772943
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1430.031784060036,
	"count": 74136,
	"is_parallel": true,
	"self": 30.897817024909273,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 24.33003257004748,
	"count": 74136,
	"is_parallel": true,
	"self": 24.33003257004748
	},
	"communicator.exchange": {
	"total": 1265.2588427510855,
	"count": 74136,
	"is_parallel": true,
	"self": 1265.2588427510855
	},
	"steps_from_proto": {
	"total": 109.54509171399377,
	"count": 74136,
	"is_parallel": true,
	"self": 23.531156822258254,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 86.01393489173552,
	"count": 593088,
	"is_parallel": true,
	"self": 86.01393489173552
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 731.8810885130597,
	"count": 74137,
	"self": 2.467187754024053,
	"children": {
	"process_trajectory": {
	"total": 160.07127956703243,
	"count": 74137,
	"self": 159.89747450903224,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.1738050580001982,
	"count": 2,
	"self": 0.1738050580001982
	}
	}
	},
	"_update_policy": {
	"total": 569.3426211920032,
	"count": 526,
	"self": 219.76144839701283,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 349.5811727949904,
	"count": 26319,
	"self": 349.5811727949904
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.3239996405900456e-06,
	"count": 1,
	"self": 1.3239996405900456e-06
	},
	"TrainerController._save_models": {
	"total": 0.1499596260000544,
	"count": 1,
	"self": 0.0037016400001448346,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.14625798599990958,
	"count": 1,
	"self": 0.14625798599990958
	}
	}
	}
	}
	}
	}
	}