First Push

849c0e6 verified 9 months ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.25450700521469116,
	"min": 0.2513265013694763,
	"max": 1.425731897354126,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 7716.65283203125,
	"min": 7531.7529296875,
	"max": 43251.00390625,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989956.0,
	"min": 29902.0,
	"max": 989956.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989956.0,
	"min": 29902.0,
	"max": 989956.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.5468913912773132,
	"min": -0.10540304332971573,
	"max": 0.6365823149681091,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 151.48892211914062,
	"min": -25.296730041503906,
	"max": 180.7893829345703,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.027380799874663353,
	"min": 0.007756194565445185,
	"max": 0.40319085121154785,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 7.584481716156006,
	"min": 2.1019287109375,
	"max": 95.55622863769531,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06598515946857837,
	"min": 0.06474892868610162,
	"max": 0.07235195697878317,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9897773920286757,
	"min": 0.5616991292927818,
	"max": 1.0584658651422096,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.017123018421019275,
	"min": 0.00023954040768810967,
	"max": 0.017123018421019275,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.25684527631528914,
	"min": 0.0033535657076335353,
	"max": 0.25684527631528914,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.443477518873336e-06,
	"min": 7.443477518873336e-06,
	"max": 0.000295215076594975,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00011165216278310004,
	"min": 0.00011165216278310004,
	"max": 0.0036090342969886,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10248112666666669,
	"min": 0.10248112666666669,
	"max": 0.19840502499999998,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.5372169000000002,
	"min": 1.4776296000000002,
	"max": 2.5725222000000003,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00025786455400000013,
	"min": 0.00025786455400000013,
	"max": 0.0098406619975,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003867968310000002,
	"min": 0.003867968310000002,
	"max": 0.12031083886000002,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.014584985561668873,
	"min": 0.014120169915258884,
	"max": 0.5579977035522461,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.21877478063106537,
	"min": 0.19768238067626953,
	"max": 4.463981628417969,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 328.7956989247312,
	"min": 285.9,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30578.0,
	"min": 15934.0,
	"max": 33048.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.5599412869500078,
	"min": -0.9998000515624881,
	"max": 1.6929050364879648,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 143.5145983994007,
	"min": -31.99360164999962,
	"max": 167.5975986123085,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.5599412869500078,
	"min": -0.9998000515624881,
	"max": 1.6929050364879648,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 143.5145983994007,
	"min": -31.99360164999962,
	"max": 167.5975986123085,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.0500471337480754,
	"min": 0.04836135261516896,
	"max": 12.475103815086186,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 4.604336304822937,
	"min": 4.1674862858781125,
	"max": 199.60166104137897,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1708911350",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1708914527"
	},
	"total": 3177.1321454090003,
	"count": 1,
	"self": 0.6001731570004267,
	"children": {
	"run_training.setup": {
	"total": 0.06533630900003118,
	"count": 1,
	"self": 0.06533630900003118
	},
	"TrainerController.start_learning": {
	"total": 3176.466635943,
	"count": 1,
	"self": 2.178739297989523,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.414482060999944,
	"count": 1,
	"self": 4.414482060999944
	},
	"TrainerController.advance": {
	"total": 3169.7864719760105,
	"count": 64068,
	"self": 2.5467041879733188,
	"children": {
	"env_step": {
	"total": 2130.257791092021,
	"count": 64068,
	"self": 1969.038138135983,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 159.8559913420636,
	"count": 64068,
	"self": 6.671488224062955,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 153.18450311800063,
	"count": 62550,
	"self": 153.18450311800063
	}
	}
	},
	"workers": {
	"total": 1.3636616139742728,
	"count": 64068,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3170.7778017090354,
	"count": 64068,
	"is_parallel": true,
	"self": 1367.4470129960123,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.007462790999966273,
	"count": 1,
	"is_parallel": true,
	"self": 0.005348088999880929,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0021147020000853445,
	"count": 8,
	"is_parallel": true,
	"self": 0.0021147020000853445
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.06342643000004955,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007525450000684941,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005173430000695589,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005173430000695589
	},
	"communicator.exchange": {
	"total": 0.0600727989999541,
	"count": 1,
	"is_parallel": true,
	"self": 0.0600727989999541
	},
	"steps_from_proto": {
	"total": 0.002083742999957394,
	"count": 1,
	"is_parallel": true,
	"self": 0.000438400999996702,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016453419999606922,
	"count": 8,
	"is_parallel": true,
	"self": 0.0016453419999606922
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1803.3307887130231,
	"count": 64067,
	"is_parallel": true,
	"self": 47.36134188999449,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 27.392768350986103,
	"count": 64067,
	"is_parallel": true,
	"self": 27.392768350986103
	},
	"communicator.exchange": {
	"total": 1600.4127628180036,
	"count": 64067,
	"is_parallel": true,
	"self": 1600.4127628180036
	},
	"steps_from_proto": {
	"total": 128.1639156540391,
	"count": 64067,
	"is_parallel": true,
	"self": 26.994489046058447,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 101.16942660798065,
	"count": 512536,
	"is_parallel": true,
	"self": 101.16942660798065
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1036.9819766960163,
	"count": 64068,
	"self": 4.510689651992379,
	"children": {
	"process_trajectory": {
	"total": 158.17156564502625,
	"count": 64068,
	"self": 157.95296877902615,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2185968660000981,
	"count": 2,
	"self": 0.2185968660000981
	}
	}
	},
	"_update_policy": {
	"total": 874.2997213989977,
	"count": 456,
	"self": 350.3324504190109,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 523.9672709799868,
	"count": 22764,
	"self": 523.9672709799868
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.1319998520775698e-06,
	"count": 1,
	"self": 1.1319998520775698e-06
	},
	"TrainerController._save_models": {
	"total": 0.08694147599999269,
	"count": 1,
	"self": 0.0019458599999779835,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0849956160000147,
	"count": 1,
	"self": 0.0849956160000147
	}
	}
	}
	}
	}
	}
	}