ppo-PyramidsRND / run_logs /timers.json
pabloyesteb's picture
Subida I
6138f93
raw
history blame
18.7 kB
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.3176240026950836,
"min": 0.3176240026950836,
"max": 1.4078160524368286,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 9625.27734375,
"min": 9625.27734375,
"max": 42707.5078125,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989952.0,
"min": 29934.0,
"max": 989952.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989952.0,
"min": 29934.0,
"max": 989952.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.6264662146568298,
"min": -0.07948450744152069,
"max": 0.6330125331878662,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 179.16934204101562,
"min": -19.155765533447266,
"max": 179.16934204101562,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": -0.010167896747589111,
"min": -0.03611525148153305,
"max": 0.405227929353714,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": -2.9080185890197754,
"min": -10.148386001586914,
"max": 96.03901672363281,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06750961403633329,
"min": 0.06569960350819658,
"max": 0.07435372414840578,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 1.0126442105449993,
"min": 0.47958796095064893,
"max": 1.0785029756370932,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.018250664120260017,
"min": 0.0008854382073355037,
"max": 0.01881936385820643,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.2737599618039003,
"min": 0.008854382073355037,
"max": 0.2737599618039003,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.5208174930933344e-06,
"min": 7.5208174930933344e-06,
"max": 0.00029515063018788575,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00011281226239640002,
"min": 0.00011281226239640002,
"max": 0.0037603354465548995,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10250690666666668,
"min": 0.10250690666666668,
"max": 0.19838354285714285,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.5376036000000002,
"min": 1.3886848,
"max": 2.6534451,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00026043997600000006,
"min": 0.00026043997600000006,
"max": 0.00983851593142857,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003906599640000001,
"min": 0.003906599640000001,
"max": 0.12535916548999998,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.009131926111876965,
"min": 0.009062698110938072,
"max": 0.42660340666770935,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.1369788944721222,
"min": 0.1268777698278427,
"max": 2.9862239360809326,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 274.2,
"min": 274.2,
"max": 991.8235294117648,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 28791.0,
"min": 16861.0,
"max": 32631.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7257999879973276,
"min": -0.9275563033297658,
"max": 1.7257999879973276,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 181.2089987397194,
"min": -29.681801706552505,
"max": 181.2089987397194,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7257999879973276,
"min": -0.9275563033297658,
"max": 1.7257999879973276,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 181.2089987397194,
"min": -29.681801706552505,
"max": 181.2089987397194,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.02603166069444948,
"min": 0.02603166069444948,
"max": 9.20870790674406,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.7333243729171954,
"min": 2.7333243729171954,
"max": 156.548034414649,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1692474035",
"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1692476421"
},
"total": 2385.7635191300005,
"count": 1,
"self": 1.1398265700017873,
"children": {
"run_training.setup": {
"total": 0.039800353999453364,
"count": 1,
"self": 0.039800353999453364
},
"TrainerController.start_learning": {
"total": 2384.5838922059993,
"count": 1,
"self": 1.43175545304166,
"children": {
"TrainerController._reset_env": {
"total": 4.028379483999743,
"count": 1,
"self": 4.028379483999743
},
"TrainerController.advance": {
"total": 2378.9574415559573,
"count": 64200,
"self": 1.5593161039860206,
"children": {
"env_step": {
"total": 1696.1974868390162,
"count": 64200,
"self": 1581.1558944628578,
"children": {
"SubprocessEnvManager._take_step": {
"total": 114.15801947410091,
"count": 64200,
"self": 4.988137964079215,
"children": {
"TorchPolicy.evaluate": {
"total": 109.1698815100217,
"count": 62565,
"self": 109.1698815100217
}
}
},
"workers": {
"total": 0.8835729020574945,
"count": 64200,
"self": 0.0,
"children": {
"worker_root": {
"total": 2378.8353249059937,
"count": 64200,
"is_parallel": true,
"self": 920.0597535019606,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.002013928999986092,
"count": 1,
"is_parallel": true,
"self": 0.000578698000026634,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014352309999594581,
"count": 8,
"is_parallel": true,
"self": 0.0014352309999594581
}
}
},
"UnityEnvironment.step": {
"total": 0.053157956000177364,
"count": 1,
"is_parallel": true,
"self": 0.0006968959996811463,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0006791390005673748,
"count": 1,
"is_parallel": true,
"self": 0.0006791390005673748
},
"communicator.exchange": {
"total": 0.049708182999893324,
"count": 1,
"is_parallel": true,
"self": 0.049708182999893324
},
"steps_from_proto": {
"total": 0.0020737380000355188,
"count": 1,
"is_parallel": true,
"self": 0.0003893570001309854,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0016843809999045334,
"count": 8,
"is_parallel": true,
"self": 0.0016843809999045334
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1458.7755714040331,
"count": 64199,
"is_parallel": true,
"self": 35.262679826835665,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 24.55862793507731,
"count": 64199,
"is_parallel": true,
"self": 24.55862793507731
},
"communicator.exchange": {
"total": 1285.7376632601145,
"count": 64199,
"is_parallel": true,
"self": 1285.7376632601145
},
"steps_from_proto": {
"total": 113.21660038200571,
"count": 64199,
"is_parallel": true,
"self": 22.551804732842356,
"children": {
"_process_rank_one_or_two_observation": {
"total": 90.66479564916335,
"count": 513592,
"is_parallel": true,
"self": 90.66479564916335
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 681.2006386129551,
"count": 64200,
"self": 2.826157913771567,
"children": {
"process_trajectory": {
"total": 118.92526791418186,
"count": 64200,
"self": 118.63489813118122,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2903697830006422,
"count": 2,
"self": 0.2903697830006422
}
}
},
"_update_policy": {
"total": 559.4492127850017,
"count": 459,
"self": 364.9500068950574,
"children": {
"TorchPPOOptimizer.update": {
"total": 194.49920588994428,
"count": 22845,
"self": 194.49920588994428
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.4260003808885813e-06,
"count": 1,
"self": 1.4260003808885813e-06
},
"TrainerController._save_models": {
"total": 0.16631428700020479,
"count": 1,
"self": 0.001997520999793778,
"children": {
"RLTrainer._checkpoint": {
"total": 0.164316766000411,
"count": 1,
"self": 0.164316766000411
}
}
}
}
}
}
}